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□ specifier=address+(size/2)+(width /2 ) 



I depth = 4 bytes \ 



width = 16 bytes\ »A |s/Ze = depth * wid th = 64 bytes'] 



address 



address is aligned to size (64 bytes), 
so low-order 6 bits are zero 
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Qwmc.c contents 



Uwmc. pa-physical address 
Qwmc. size- size of contents 
□ wmc. cv-con ten ts valid 
Dwmc.th- thread last used 
Uwmc.reg-register last used 
Owmc.rtv-register & thread valid 
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def data,flags <- AccessPhysicalLTB(pa,op,wdata) as 
th«-pa23..i9 
en<-pa6..4 

if (en < (1 || 0 LE )) and (th < T) and (pa i8 ..6=0) then 
case op of 
R: 

_data <- 0 64 || LTBArray[th][en] 

fa: 

LocalTB[th][en] <- wdata63..o 

endcase 

else 

data <- 0 

endif 
enddef 

Fig. 16 
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def ga.LocalProtect <- LocalTranslationfth.ba.la^l) as 
if LB & (ba63..48 © I363..48) then 

raise AccessDisallowedByVlrtualAddress 

endif 

m <-NONE 
fori<-0to(1 || 0 LE )-1 

if (I363..48 & -LocalTB[th][063..48) = LocalTB[th][i]47..32 then 
me <r- i 

endif . 
endfor 

if me = NONE then 

if ~ControlRegister p i+8 then 
raise LocalTBMiss 

endif 
ga*-la 

LocalProtect <- 0 

else 

ga <- (va 6 3..48 A LocalTB[th][me] 31 .. 16 ) II va4 7 .. 0 
LocalProtect <- LocalTB[th][me]i5„o 

endif 
enddef 

Fig. 22 
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def data,flags <- AccessPhysicalGTB(pa,op,wdata) as 
th<-pa 23 ..i9+GT II 0 GT 
en<-paig„4 

if (en < (1 || 0 G )) and (th < T) and (pai 8 +GTU9 = 0) then 
case op of 
R: 

data <- GTBArray[th 5 GT][en] 

- — :W: 

GTBArray[th 5 ..GT][en] wdata 

endcase 

else 

data<-0 

endif 

enddef 

Fig. 24 
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def pa.GlobalProtect <- GlobalAddressTranslation(th,ga,pl,lda) as 
me <- NONE 
fori<-0to(1 ||0 G )-1 

if GlobalTB[th 5 .. G T][i] * 0 then 

size <- (GlobalTBlth 5 .. G T][i]63..7 and (0 64 -GlobalTB(th 5 ..GT][U63..7)) II 0 8 
'f ((ga63..8l|0 8 ) A (GlobalTB[th 5 .. G T][i]63..8ll0 8 )) and (0 64 -size)) = 0 then 
me <- GlobalTB[th5..GT]li] 

endif 

endif 
endfor 

if me = NONE then 
if Ida then 

PerformAccessDetail(AccessDetailRequiredByLocalTB) 

endif 

raise GlobalTBMiss 

else 

pa *- (ga 6 3..8 A GlobalTB[th5..GT][me] 12 7..72) II 937..0 
GlobalProtect <- GlobalTB[th 5 ..GT][me]7i.. 6 4 II 0 1 1| GlobalTB[th5..GT][me] 6 .. 0 
endif * • 
enddef 
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def GTBUpdateWrite(th f fill,data) as 
me <- NONE 
fori<-0to(1 ||0 G )-1 

size <- (GlobalTB[th 5 ..GT][i]63. J and (0 64 -GlobalTB(th 5 .. GT ][i] 63 >7 )) II 0 8 
if ((data 6 3..8l|0 8 ) A (GlobalTB[th 5 .. G T][i]63..8ll0 8 )) and (O^-size) = 0 th n 
m <- i 

endif 
endfor 

if me = NONE then 
if fill then 

GlobalTB[th5..GT][GTBLast[th 5 ..GT]] <- data 
GTBLast[th 5 ..GTl <- (GTBLast[th 5 .. G Tl + 1)<5-1..0 
if GTBLast[th 5 ..GT] = 0 then 

GTBLast[th 5 ..GTl «- GTBFirst[th 5 .. G T] 

GTBBumpfths „gt] <- 1 

endif 

endif 

else 

GlobalTB[th5 > .GT][me] <- data 

endif 
enddef 
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def data.flags <- AccessPhysicalGTBRegisters(pa,op,wdata) as 
th <- pa 2 3..i9+6T II 0 GT 
rn <- paia..8 

if (rn < 5) and (th < T) and (pais+GT..l9 = 0) and (pa7..4 = 0) then 
cas rn || op of 
0|| R.1|| R: 

data <r- 0 
0 || W, 1 || 

GTBUpdateWrite(th,rn 0 ,wdata) 
2||R: 

data «- O 64 " 6 || GTBLastIth 5 G tJ 
2||W: 

GTBLast[ths gt] «- wdatao-1 o 
3 || R: 

data <- O 64 ' 6 || GTBFirst[th 5 gt] 
3||W: 

GTBFirst[th5 gt] <- wdatao-1 o 
3 II R: 

data 0 63 1| GTBBumpphs qt] 
3||W: 

GTBBumpphs,. gt] «- wdatao 

endcase 

else 

data <- 0 

endif 
enddef 
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Ig.boolean' 



Group Boolean 



Equivalencies 



G.AAA 


Group three-way and 


G.AAA.1 


Group add add add bits 


G.AAS.1 


Group add add subtract bits 


G.ADD.1 


Group add bits 


G.AND 


Group and 


G.ANDN 


Group and not 


G.COPY 


Group copy 


G.NAAA 


Group three-way nand 


G.NAND 


Group nand 


G.NOOO 


Group three-way nor | 


G.NOR 


Group nor 


G.NOT 


Group not 


G.NXXX 


Group three-way exclusive-nor 


G.000 


Group three-way or 


G.OR 


Group or 


G.ORN 


Group or not 


G.SAA.1 


Group subtract add add bits 


G.SAS.1 


Group subtract add subtract bits 


G.SET 


Group set 


G.SET.AND.E.1 


Group set and equal zero bits 


G.SET.AND.NE.1 


Group set and not equal zero bits 


G.SET.E.1 


Group set equal bits 


G.SET.G.1 


Group set greater signed bits 


G.SET. G.U.1 


Group set greater unsigned bits 


G.SET.G.Z.1 


Group set greater zero signed bits I 


G.SET.GE.1 


Group set greater equal signed bits | 


G.SET.GE.Z.1 


Group set greater equal zero signed bits 


G.SET.L1 


Group set less signed bits j 


G.SET.LZ.1 


Group set less zero signed bits j 


G.SET.LE.1 


Group set less equal signed bits 


G.SET.LE.U.1 


Group set less equal unsigned bits 


G.SET.LE.Z.1 


Group set less equal zero signed bits 


G.SET.NE.1 — . 


Group set not equal bits 


G.SET.GE.U.1 


Group set greater equal unsigned bits 


G.SET.LU.1 ! 


Group set less unsigned bits 



Fig. 31 A 



G.SSA.1 


Group subtract subtract add bits 


G.SSS.1 


Group subtract subtract subtract bits 


G.SUB.1 


Group subtract bits 


G.XNOR 


Group xclusive-nor j 


G.XOR 


Group exclusive-or 


G.XXX 


Group three-way exclusive-or 


G.ZERO 


Group zero 



G AAA rri(rf)rr rh 


<— 


VjlDvJULc/MN ru(gjrC f rD,UD1 UUUUUUU 


G AAA 1 rd(a)rc rh 


— > 


CX YYY rH/T^m rK 


G AAS 1 rd(a)rr rh 


— > 


f5 YYY rH/77WA rK 


G ADD 1 rd=rr rh 


— > 


vj.AUK ru— iCjiD 


G AND rri—rr rh 


<— 




G ANDN rd=rc rh 


<— 


o.duulcan ra^Ggrc^D.ODOioooioo 


G BOOLEAN rrftrhrh rr i 


—> 


l_ LJ flfil | - A M /f*d\ ■ !_!.! - J _ ! . !_ I _ 

o.DUULtAiM raQGgrc v rD t i7i5i6i4i3il >2>0 


fl PHP V rrl—rn 


<- 


r^ D^^^^l P A M 1 /?v _ AAAi AAA 

G. BOOLEAN rd@rc,rc,0b1 0001 000 


a MA A A rrlfrhrr* rh 


<- 


Q/"\/"\l CAM — . _t_. f\\^f\A A A A A A A 

G. BOOLEAN rd@rc,rb,0b01 111111 


{2 AM KID rrl—rn rh 


^ 


r* D r\r\l r" A M «J/Sv» — *- y\L Aj< «i j ni <4 ^ 1 

G.BOOLEAN rd@rc,rb,0b01 1 101 1 1 j 


{2 A/OnD rr4(r7\rr* rh 


<- 


r* r% r\ r*\ i r~ a kl acaaaaaaa^ 

G.BOOLEAN rd@rc f rb,0b00000001 


G NOR rri—rr rh 


<- 


/"^ D /^/^l CAM atJ/S^M -1- r\i_ A A A A /\ f\f\ A 

G.BOOLEAN rd@rc,rb,0b000 10001 j 


G NOT rri-rr 


<— 


r^ P /"\/"\| CAM .J — — ^ . ALAAA4 AAA4 

G.BOOLEAN rd@rc > rc,0b00010001 


n NYYY rrlfrftrn rh 


<- 


G.BOOLEAN rd@rc,rb,0b01101001 




<- 


["1 /""\/"\| AM 1 /2i _ t, ^ \^ A A A A A A A f\ 

G.BOOLEAN rd@rc,rb,0b1 1111110 


G.OR rd=rc,rb 




G BOOLEAN rd(S)rr rh0h11ini1in 


G.ORN rd=rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b1 101 1101 


G.SAA.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb [ 


G.SAS.1 rd@rc,rb 


-» 


G.XXX rd@rc,rb 


G.SETrd 


<- 


G.BOOLEAN rd@rd,rd,0b1 0000001 


G.SET.AND.E.1 rd=rb,rc 


-> 


G.NAND rd=rc,rb 


G.SET.AND.NE.1 rd=rb,rc 


-> 


G.AND rd=rc,rb | 


G.SET.E.1 rd=rb,rc 


-> 


G.XNOR rd=rc,rb 1 


G.SET.G.1 rd=rb,rc 


-> 


G.ANDN rd=rc,rb 


G.SET.G.U.1 rd=rb,rc 


-» 


G.ANDN rd=rb,rc 


G.SET.G.ZPrd=rc 


-> 


G.ZERO rd A 


G.SET.GE.1 rd=rb,rc 


-> 


G.ORN rd=rc,rb 


G.SET.GE.Z.1 rd=rc 


-> 


G.NOTrd=rc 



Fig. 31 A (cont'd) 



G.SET.L 1 rd~rb,rc 


-> 


G.ANDN rd=rb,rc 


G.SET.LZ.1 rd=rc 


-» 


G.COPY rd=rc 


G.SET.LE.1 rd=rb,rc 


-> 


G.ORN rd=rb,rc j 


G.SET.LE.U.1 rd=rb,rc 




G.ORN rd=rc,rb 


G.SET.LE.Z.1 rd=rc 




G.SET rd 


G.SET.NE.1 rd=rb,rc 


-> 


G.XOR rd=rc,rb 


G.SET.GE.U.1 rd=rb,rc 


-> 


G.ORN rd=rb,rc 


G.SET.L U. 1 rd=rb,rc 


-> 


G.ANDN rd=rc,rb 


G.SSA.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SSS.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SUB.1 rd=rc,rb 




G.XOR rd=rc,rb 


G.XNOR rd=rc,rb 


<- 


G.BOOLEAN rd@rc,rb,0b1 001 1001 


G.XOR rd=rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b01100110 


G.XXX rd@rc,rb 


<— 


G.BOOLEAN rd@rc,rb,0b10010110 


G.ZERO rd 


<- 


G.BOOLEAN rd@rd,rd,0b00000000 



Selection 



operation 


function (binary) 


function (decimal) 
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11110000 


240 
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11001100 


204 
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10101010 


176 


d&c&b 


10000000 


128 


(d&c)|b 


11101010 


234 j 


d|c|b 


11111110 


254 


d?c:b 


11001010 


202 


d^b 


10010110 


150 


~d A c A b 


01101001 


105 
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00000000 


0 



Fig. 31A (cont'd) 



Format 

G.BOOLEANrd@trc,trb,f 
rd=gbooleani(rd,rc,rb,f) 

31 252423 18 17 12 11 6 5 

| g.boolean |jh| rd | rc I rb | il 

7 1 6 6 6 6 

if f6=fs then 

if f2=f 1 then 

if f2 then 

rc <- max(trc,trb) 
rb «- min(trc,trb) 

else 

rc «- min(trc,trb) 
rb <- max(trc,trb) 

end if 
ih<-0 

il<-0||f6||f7||f4l|f3l|f0 



else 



else 



if f2 then 

rc <- trb 
rb <r- trc 

else 

rc *- trc 
rb <- trb 

endif 
ih<-0 

il<-1||f6||f 7 ||f4l|f3l|f0 



endif 



ih<-1 
if f6 then 

rc -e- trb 

rb<-trc 

il<-fll|f2l|f7l|f4l|f3l|fo 

else 

rc <- trc 
rb«-trb 

il<-f2l|fl I|f7||f4l|f3l|f0 

endif 



endif 



Definition 

def GroupBoolean (ih.rd.rcrb.il) 
d <~ RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
if ih=0 then 

if il5=0 then 

f<-il3 II >4 II "4 II H 2 II Hi II (rc>rt»2 || il 0 

else 

^ f^H3lMUHil4l|il2l|ill IIO||1||il 0 
end if 

else 

f<-l3l|0||1||l2l|Hi||l 5 ||l4||lo 

end if 

fori<-Oto 127 by size 

ai<-f(di||q||bi) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

none 



Fig. 31C 



Operation code 



I G.MUX 1 Group multiplex 



Redundanci s 



G.MUX ra=rd,rc,rc 




G.COPY ra=rc 


G.MUX ra=ra,rc,rb 


<=> 


G.BOOLEAN ra@rc,rb,0x1 1001010 


G.MUX ra=rd,ra,rb 




G.BOOLEAN ra@rd,rb,0x1 11 00010 


G.MUX ra=rd,rc,ra 


<=> 


G.BOOLEAN ra@rd,rc,0x1 101 1000 


G.MUX ra=rd,rd,rb 


o 


G.OR ra=rd,rb 


G.MUX ra=rd,rc,rd 


<=> 


G.AND ra=rd,rc 



Format 



G.MUX ra=rd,rc,rb 
ra=gmux(rd,rc,rb) 

31 24 23 18 17 12 11 6_5 0 

I G.MUX | rd j rc | rb | ra I 

8 6 6 6 6 

Fig. 31D 



Definition 

def GroupTemaryfop^ize.rd.rc.rb.ra) as 
d +- RegRead(rd, 128) 
c «- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 
G.MUX: 

a <- (c and d) or (b and not d) 

endcase 

RegWrite(ra. 128 f a) 
enddef 

Exceptions 

none 

Fig. 31D 
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G ADD 128 O 


GrouD add sianed hexlet check overflow 

1 V/VI »/ 14\JM WlMI IWM 1 ■ W/AI W • V* > 1 WVI\ ▼ ■ 1 IV ft 


G.ADD.U.8.0 


Group add unsigned bytes check overflow 


G.ADD.U.16.0 


Group add unsigned doublets check overflow 


G.ADD.U.32.0 


Group add unsigned quadlets check overflow 


G.ADD.U.64.0 


Group add unsigned octlets check overflow 


G.ADD.U.128.0 


Group add unsigned hexlet check overflow 



Fig. 32A 



Format 



G.op.size rd=rc,rb 
rd=gopsize(rc,rb) 

31 24 23 18 17 12 11 65 0 

I G.size | rd | rc I rb | op ~| 

8 6 6 6 6 



Fig. 32B 



Definition 



def Group(op f size,rd f rc f rb) 
c<- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 
G.ADD: 

for i <- 0 to 128-size by size 

ai+size-1..i «- Ci+size-1..i + b|+ S ize-1.J 
endfor 
G.ADD.L: 

for i <- 0 to 128-size by size 

t «- (Ci+slze-1 II Cj+size-1..i) + (bj+size-1 II bj+size-1 ..i) 

ai+size-1.J «- (tsize * Wi) ? (t size || t|j|g:^ ) : t sjze -i..o 
endfor 
G.ADD.L.U: 

for i «- 0 to 1 28-size by size 

t <- (0 1 || c i+siz e-i .j) + (0 1 || bj+size-1 ..i) 

aj+size-1..i «- (tsize * 0) ? (1*™) : W1..0 
endfor 
G.ADD.O: 

for i <- 0 to 128-size by size 

t <- (Cj +S | ze .i || q+size-1 ..i) + (bi+size-1 II bj+size-1 ■ J) 
if t$jze * t s j ze _f then 

raise FixedPointArithmetic 

end if 

a i+size-1..i <- tsize-1..0 
endfor 
G.ADD. U.O: 

for i <- 0 to 1 28-size by size 

t <- (0 1 || c i+S ize-1..i) + (0 1 || b i+S ize-1..i) 
if tsize * 0 then 

raise FixedPointArithmetic 

end if 

a i+size-1..i <- tsize-1..0 
endfor 

endcase 

RegWrite(rd, 128,a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 32C 



Operation codes 



G.SET.AND.E.8 


Group set and equal zero bytes 


G.SET.AND.E.16 


Group set and equal zero doublets 


G.SET.AND.E.32 


Group set and equal zero quadlets 


G.SET.AND.E.64 


Group set and equal zero octlets 


G.SET.AND.E.128 


Group set and equal zero hexlet 


G.SET.AND.NE.8 


Group set and not equal zero bytes 


G.SET.AND.NE.16 


Group set and not equal zero doublets 


G.SET.AND.NE.32 


Group set and not equal zero quadlets j 


G.SET.AND.NE.64 


Group set and not equal zero octlets 


G.SET.AND.NE.1 28 


Group set and not equal zero hexlet 


G.SET.E.8 


Group set equal bytes 


G.SET.E.16 


Group set equal doublets 


G.SET.E.32 


Group set equal quadlets 


G.SET.E.64 


Group set equal octlets 


G.SET.E.128 


Group set equal hexlet 


G.SET.GE.8 


Group set greater equal signed bytes 


G.SET.GE.16 


Group set greater equal signed doublets 


G.SET.GE.32 


Group set greater equal signed quadlets 


G.SET.GE.64 


Group set greater equal signed octlets 


G.SET.GE.128 


Group set greater equal signed hexlet 


G.SET.GE.U.8 


Group set greater equal unsigned bytes 


G.SET.GE.U.16 


Group set greater equal unsigned doublets 


G.SET.GE.U.32 


Group set greater equal unsigned quadlets 


G.SET.GE.U.64 


Group set greater equal unsigned octlets 


G.SET.GE.U.128 


Group set greater equal unsigned hexlet 


G.SET.L.8 


Group set signed less bytes 


G.SET.L.16 


Group set signed less doublets 


G.SET.L.32 


Group set signed less quadlets 


G.SET.L.64 


Group set signed less octlets 


G.SET.L.128 


Group set signed less hexlet 


G.SET.LU.8 


Group set less unsigned bytes 


G.SET.LU.16 


Group set less unsigned doublets 


G.SET.L.U.32 


Group set less unsigned quadlets 


G.SET.LU.64 


Group set less unsigned octlets 


G.SET.LU.128 


Group set less unsigned hexlet 


G.SET.NE.8 


Group set not equal bytes 


G.SET.NE.16 


Group set not equal doublets 



Fig. 33A 



G SET NE 32 


GrouD set not poual nuadlets 


G SET NE 64 


GrouD set not eoual octlets 


G SET NE 128 


GrotiD set not eoual hexlet 

V^l VWW Wwl 1 IVI WNJ W/Wil V IVAIw* 


G SUB 8 


GrouD subtract bvtes 


G SUB 8 O 


f^rnun suhtrapt Qinnpri hvtps phppk nv/prflow 

VJIUUp OUULIOwl wlvj 1 ICU UYICO vl iCUl\ UVCi 1 IUW 


G SUB 16 


GrouD subtract doublets 


G SUB 16 O 


f^rnun snhtrapt Qinnpri dnnhlptQ phppk ox/prflnxA/ 

vl UU|J OUUU dU OlU,l ICU UUUUIClo Vyl UVCI llUW 


G SUB 32 

W. O ULJ.U<c. 


GrouD subtract nuadlets 


G SUB 32 O 


f^roun suhtrapt tinned nuadlpts phppk nvprflnw 

VJIvUp OUUUCIV/l wl^ 1 ICU IjUCIUICld Ul ICvi\ UVCIItwW 


G SUB 64 


Grouo subtract optlets 

1 w w. U wUUU MVi WwUwlw 


G SUB 64 O 


r^rnim suhtract Qinnpri npflpfQ phopk pi\/orfln\A/ 

vl UUp wUUlldwl wlU,l ICu UOUCld Ul ICUIx UVCI MUW 


G SUB 128 


GrouD subtract hexlet 


G SUB 128 O 


fnroiin Qiihtrarf sinneri hpylpf phppk n\/P rflnw 

vlUUp OUUU Owl Ol^llCU 1 ICAICl Ul ICUf\ UVCI 1 IU w 


G SUB L 8 


Grouo subtract limit sianed bvtes 

wl WU|i/ WwwWI wtwV 111111% wImI Iw W/ WJ w 4ww 


G SUB 116 


Grouo subtract limit sinned doublets 

VIUUM wuuuav/i III 1 111 Ol^l ICU UvUUIvlO 


G SUB L 32 


Grouo subtract limit sinned nuadlets 

VI wU|/ wUWU Wlwi III 1 111 wl VJ 1 1 w w uuauivio 


G SUB L 64 

v> >UUU,L. U*T 


Grouo subtract limit sinned octlets 

VI will/ wUUU Qvl llll 111 wlUI IvU vwllvlw 


G SUB L 128 

V .UUU.L. 1 ^.U 


Grouo subtract limit sinned hexlpt 

VI WU|/ vUVII Qvl llll 111 wlUI IwU I IvAICI 


G SUB L U 8 


Grouo subtract limit unsioned bvtes 

wl VUm vUVlluvl III llll Ul IwlUl IwU UJflvw 


G SUB L U 16 


Grouo suhtract limit unsinned dnuhlets 

vlUUf/ OUUU CJ wl III llll Ul IOIU,l IvU vlUUUIvlw 


G SUB L U 32 


Grouo suhtract limit unsinnpd nuadlets 

V— » I \J\jyj OUUUQvi III lift Ul IwlUI IwU VjUwUIClO 


G SUB L U 64 


Grouo subtract limit unsinned octlets 

V«#l \J\JyJ wUUllwJwl III llll Ul IwlUI IwU w wll w lw 


G SUR I I J 128 


Grouo suhtract limit unsinned hpylpt 

WIUUp OUUU uvl III llll Ul IwlUI IvU 1 IvAICl 


G SUB U 8 O 


f^roi in ci ihtrnf*t iincinnoH Kvtoc phppk n\/orfln\A/ 
oiuup oiiuudu uiioiyiicu uyico uiicur uvciiiuw 


G.SUB.U.16.0 


Group subtract unsigned doublets check overflow 


G.SUB.U.32.0 


Group subtract unsigned quadlets check overflow 


G.SUB.U.64.0 


Group subtract unsigned octlets check overflow 


G.SUB.U.128.0 


Group subtract unsigned hexlet check overflow 



Fig. 33A (cont'd) 



Equivalenci s 



G.SET.E.Z.8 


Group set equal zero bytes 


G.SET.E.Z16 


Group set equal zero doublets 


G.SET.E.Z.32 


Group set equal zero quadlets 


G.SET.E.Z.64 


Group set equal zero octlets 


G.SET.E.Z.128 


Group set equal zero hexlet 


G.SET.G.Z.8 


Group set greater zero signed bytes 


G.SET.G.Z.16 


Group set greater zero signed doublets 


G.SET.G.Z.32 


Group set greater zero signed quadlets 


G.SET.G.Z.64 


Group set greater zero signed octlets 


G.SET.G.Z128 


Group set greater zero signed hexlet 


G.SET.GE.Z.8 


Group set greater equal zero signed bytes 


G.SET.GE.Z.16 


Group set greater equal zero signed doublets 


G.SET.GE.Z.32 


Group set greater equal zero signed quadlets 


G.SET.GE.Z.64 


Group set greater equal zero signed octlets 


G.SET.GE.Z128 


Group set greater equal zero signed hexlet 


G.SET.LZ8 


Group set less zero signed bytes 


G.SET.LZ.16 


Group set less zero signed doublets 


G.SET.L.Z.32 


Group set less zero signed quadlets 


G.SET.LZ.64 


Group set less zero signed octlets 


G.SET.L.Z.128 


Group set less zero signed hexlet 


G.SET.LE.Z.8 


Group set less equal zero signed bytes 


G.SET.LE.Z.16 


Group set less equal zero signed doublets 


G.SET.LE.Z.32 


Group set less equal zero signed quadlets 


G.SET.LE.Z.64 


Group set less equal zero signed octlets 


G.SET.LE.Z.128 


Group set less equal zero signed hexlet 


G.SET.NE.Z8 


Group set not equal zero bytes 


G.SET.NE.Z16 


Group set not equal zero doublets 


G.SET.NE.Z32 


Group set not equal zero quadlets 


G.SET.NE.Z.64 


Group set not equal zero octlets 


G.SET.NE.Z.128 


Group set not equal zero hexlet 



Fig. 33A (cont'd) 



6 SETLE.8 


Group set less equal signed bytes 


G SETLE.16 


Group set less equal signed doublets 


G SET.LE.32 


Group set less equal signed quadlets 


G SET.LE.64 


Group set less equal signed octlets 


GSET.LE.f28 


Group set less equal signed hexlet 


G SETLE.U.8 


Group set less qual unsigned bytes 


G.SET.LE.U.16 


Group set less equal unsigned doublets 


G SET.LE.U.32 


Group set less equal unsigned quadlets 


G SET LE.U.64 


Group set less equal unsigned octlets 


G SET LE U 128 


Group set less equal unsigned hexlet 


G SET G 8 


Group set signed greater bytes 


G.SET.G.16 


Group set signed greater doublets 


G.SET.G.32 


Group set signed greater quadlets 


G.SE7.G.64 


Group set signed greater octlets 


G.SET.G.f28 


Group set signed greater hexlet 


G SET.G.U.8 


Group set greater unsigned bytes 


G.SET.G.U.16 


Group set greater unsigned doublets 


G.SET.G.U.32 


Group set greater unsigned quadlets 


G.SET.G.U.64 


Group set greater unsigned octlets 


G.SET.G.U.128 


Group set greater unsigned hexlet 




G.SET.E.Zsize rd=rc 


<- G.SET.AND.E.size rd=rc,rc [ 


G.SET.G.Z.size rd=rc 


<= G.SET.L.U.size rd=rc,rc 


G. SET. GE. Z. size rd=rc 


<= G.SET.GE.size rd=rc,rc 


G.SET.L.Z.size rd=rc 


<= G.SET.L.size rd=rc,rc 


G.SET.LE.Zsize rd-rc 


<= G.SET.GE.U.size rd=rc,rc 


G.SET.NE.Z.size rd=rc 


<r- G.SET.AND.NE.size rd=rc,rc 


G.SETG.size rd=rb,rc 


-> G.SET.L.size rd=rc,rb 


G.SET.G.U.size rd=rb,rc -> G.SET.L.U.size rd=rc,rb 


G.SET.LE.size rd=rb,rc 


-> G.SET.GE.size rd=rc,rb 


G.SET.LE.U.size rd=rb,rc -» G.SET.GE.U.size rd=rc,rb 



Fig. 33A (cont'd) 



Format 



G.op.size rd=rb,rc 
rd=gopsize(rb,rc) 

31 24 23 18 17 12 11 65 0 

I G.size | rd | rc | rb | op | 

8 6 6 6 6 



Fig. 33B 



Definition 

def GroupReversed(op,siz ,rd,rc,rb) 
c <- RegRead(rc t 128) 
b <- RegRead(rb, 128) 
case op of 
G.SUB: 

for i <- 0 to 128-size by size 

a i+size-1 ..i <- bi+size-1 ..i - Ci+size-1 ..i 
endfor 
G.SUB.L: 

for i ^- 0 to 128-size by size 

t <- (bi+size-1 II bi+size-1..i) - (cj+size-1 II Q+size-1 ..i) 

ai+size-1. .i <- (tsize * t S ize-l) ? (tsize II tijf§:1) : t S ize-1..0 
endfor 
G.SUB.LU: 

for i «- 0 to 128-size by size 

t <- (0 1 || b j+S ize-1..i) - (0 1 II q+size-U) 

a|+size-1..i «- (tsize * 0) ? 0 slze : t S |ze-1..0 
endfor 
G.SUB.O: 

for i <- 0 to 1 28-size by size 

t <- (bj+size-1 II bi+size-1..i) " ta+size-1 II Cj+ S ize-1..i) 
if (tsize ^size-l) then 

raise FixedPointArithmetic 

endif 

ai+size-1J^t S i ze -i..o 
endfor 
G.SUB.U.O: 

for i <- 0 to 128-size by size 

t <- (0 1 || bj+size-Lj) - (0 1 || c i+S ize-1..i) 
if (tsize * 0) then 

raise FixedPointArithmetic 

endif 

aj+size-1 ..j <- tsize-1 ..0 
endfor 
G.SET.E: 

for i +- 0 to 1 28-size by size 

aj+size-1 ..» «- (&i+size-1..i a Cj+size-1 ..i) size 
endfor 
G.SET.NE: 

for i <- 0 to 128-size by size 

* -af+size-1 ..i <r (bj+size-1 ..i * Cj +S j ze -1 j) slze 
endfor 
G.SET.AND.E: 

for i <- 0 to 128-size by size 

ai+size-1. .i *- ((&i+size-1..i and q+ S ize-1..i) = 0) s,ze 
endfor 

Fig. 33C 



G.SET.AND.NE: 

for i <- 0 to 1 28-siz by siz 

ai+size-1..i «- ((&i+size-1..i and Cj+ S ize-1..i) * 0) size 
endfor 
G.SET.L: 

for i <- 0 to 1 28-siz by size 

ai+size-1..i «- ((re = rb) ? (bi+ S ize-1.J < 0) • (bi+size-1 ..i < Cj+ S ize-1..i)) size 
endfor 
G.SET.GE: 

for i <- 0 to 128-size by size 

ai+size-1..i <- ((rc = rb) ? (bi+ S jze-1.j °) • (bi+size-1..i * Ci +S j ze .i j)) size 
endfor 
G.SET.LU: 

for i <- 0 to 128-size by size 

ai+size-1..i *- ((rc = rb) ? (bj+ s ize-1..i > 0) • 
((0 || bi+size-u) < (0 || q +S ize-1..i))) s * e 

endfor 
G.SET.GE.U: 

for i <- 0 to 128-size by size 

ai+size-l..i «- ((re = rb) ? (b i+S lze-1.J * 0) : 
((O||bi +S i Z e-i..i)^(O||q +siZ e-i.j))) slz0 

endfor 

endcase 

RegWrite(rd, 128, a) 
nddef 



Exceptions 

Fixed-point arithmetic 



Fig. 33C (cont'd) 



E.DIV.64 


Ensemble divide signed octlets 


E.DIV.U.64 


Ensemble divide unsigned octlets 


E.MUL8 


Ens mble multiply signed bytes 


E.MUL16 


Ensemble multiply signed doublets 


E.MUL32 


Ensemble multiply signed quadlets 


E.MUL64 


Ensemble multiply signed octlets 


E.MULSUM.8 


Ensemble multiply sum signed bytes 


E.MULSUM.16 


Ensemble multiply sum signed doublets 


E.MULSUM.32 


Ensemble multiply sum signed quadlets 


E.MUL.SUM.64 


Ensemble multiply sum signed octlets 


E.MUL.C.8 


Ensemble complex multiply bytes 


E.MUL.C.16 


Ensemble complex multiply doublets 


E.MUL.C.32 


Ensemble complex multiply quadlets 


E.MULM.8 


Ensemble multiply mixed-signed bytes 


E.MULM.16 


Ensemble multiply mixed-signed doublets 


E.MULM.32 


Ensemble multiply mixed-signed quadlets 


E.MULM.64 


Ensemble multiply mixed-signed octlets 


E.MULP.8 


Ensemble multiply polynomial bytes J 


E.MULP.16 


Ensemble multiply polynomial doublets 


E.MULP.32 


Ensemble multiply polynomial quadlets 


E.MULP.64 


Ensemble multiply polynomial octlets 


E.MULSUM.C.8 


Ensemble multiply sum complex bytes 


E.MUL.SUM.C.16 


Ensemble multiply sum complex doublets 


E.MULSUM.C.32 


Ensemble multiply sum complex quadlets 


E.MULSUM.M.8 


Ensemble multiply sum mixed-signed bytes 


E.MULSUM.M.16 


Ensemble multiply sum mixed-signed doublets j 


E.MUL.SUM.M.32 


Ensemble multiply sum mixed-signed quadlets 


E.MULSUM.M.64 


Ensemble multiply sum mixed-signed octlets 


E.MULSUM.U.8 


Ensemble multiply sum unsigned bytes 


E.MULSUM.U.16 


Ensemble multiply sum unsigned doublets 


E.MUL.SUM.U.32 


Ensemble multiply sum unsigned quadlets 


E.MULSUM.U.64 


Ensemble multiply sum unsigned octlets 


E.MULU.8 


Ensemble multiply unsigned bytes 


E.MULU.16 


Ensemble multiply unsigned doublets 


E.MULU.32 


Ensemble multiply unsigned quadlets 


E.MULU.64 


Ensemble multiply unsigned octlets 



Fig. 34A 



Format 

E.op.size rcNrc.rb 
rd=eopsize(rc,rb) 

31 24 23 18 17 12 11 65 0 

| E.size | rd | rc | rb | op | 

8 6 6 6 6 



Fig. 34B 



Definition 



def muKslze^vs.v.i.ws.wj) as 

mul <- ((vs&v sjze .i + i) h - slze II v size -i + i;.i) * ((ws&w size -i + j) h ' sl2e || w size -i + j..j) 
enddef 

def c <- PolyMultiply(size.a.b) as 

pIOl^O 2 *^ 
for k <- 0 to size-1 

p[k+1] 4- p[k] A a k ? (fjsize-k jj b ( | 0 k) . 0 2*size 

endfor 
c 4- p[size] 
enddef 

def Ensemb!e(op,$ize,rd,rc,rb) 
c 4- RegRead(rc t 128) 
b 4- RegRead(rt), 128) 
case op of 

E.MUL:, E.MULC:, EMULSUM, E.MULSUM.C. E.CON, E.CON.C, E.DIV: 

cs <- bs 4- 1 
E.MULM:, EMUL.SUM.M, E.CON.M: 

CS 4- 0 

DS4-1 

E.MULU:, EMULSUM.U, E.CON.U, E.DIV.U, E.MUL.P: 
cs <- bs <- 0 

endcase 
case op of 

E.MUL, E.MULU, E.MUL. M: 

for i 4- 0 to 64-size by size 

d2*(i+size)-1..2*i «- mul(size,2*size,cs,c,i,bs,b,i) 

endfor 
E.MULP: 

for i 4- 0 to 64-size by size 

d2*(i+size)-1..2*i «- PolyMultjply(size,c S j ze .i+i..i,b s i Z e-i+j..i) 

endfor 
E.MUL.C: 

for i 4- 0 to 64-size by size 
if (i and size) = 0 then 

p 4- mul(size.2*size,1,c,i ( 1,b,i)- mul(size,2*size,1,c f i+size,1,b,i+size) 

else 

p 4- muKsize^sizeAci.l.b.i+size) + mul(size,2*size,1,c,i,1,b,i+size) 

endrf 

d2*(i+size)-1..2*i<-P 

endfor 

E.MUL.SUM, E.MULSUM.U, E.MUL.SUM.M: 
p[0]4-0 128 

for i 4- 0 to 1 28-size by size 

pp+size] 4- p[i] + mul(size,128,cs,c,i,bs,b,i) 

endfor 
a 4- p[128] 
E.MULSUM.C: 

PI014-0 64 
p[size] 4- 0 64 

for i 4— 0 to 1 28-size by size 
if (i and size) = 0 then 

pp+2*size] 4- p[i] + mul(size,64,1,c,i,1,b,i) 

- mul(size,64,1 ,c,i+size t 1 ,b,i+size) 

else 

pp+2*size] 4- p[i] + mul($ize,64 l 1,c t i.1.b,l+size) 

+ mul(size,64,1 .ci+size.1 ,b,i) 

endif 

endfor 

3 4-p[128+siz ]||p[128] 

Fig. 34C 



E.CON, E.CON.U, E.CON.M: 
p[0]<-0 128 

forj <- 0to64-siz bysize 

for i <- 0 to 64-size by size 

pD+slzel^fl+size)-!.^*! «- PlD2*(i+size>-1..2*i + 
mul(siz ,2*size,cs,c,i+64-|,bs ( bj) 

endfbr 

endfor 
a <- p[64] 
E.CON.C: 

p[0]<-0 128 

for j 4- 0 to 64-size by size 

for i <- 0 to 64-size by size 

if ((H) and j and size) = 0 then 

p0+size]2*(i+size)-1..2*i «- PtD2*(i+size)-1»2*i 
mul(size,2*slze, 1 ,c,i+6H t ,bj) 

else 

pO+sizeJ^fi+size)-!.^ «- Pfll2*0+size).1..2*i 
mul(size,2*size,1 ,c,i+64-j+2*size t 1 ,b j) 

endif 

endfor 

endfbr 
a <- p[64] 

E.DIV: 

if (b = 0) or ( (c = (1H0 63 )) and (b = 1 64 ) ) then 
a «- undefined 

else 

q«-c/b 
r «~ c - q*b 
a«-r63..0 UQ63..0 

endif 
E.DIV.U: 

ifb = 0then 

a «- undefined 

else 

q<-(0||c)/(0||b) 
r^c-(0|I q)*(0 1| b) 
a «- r 63..0 II P63..0 

endif 

endcase 

RegWrite(rd, 128, a) 
nddef 



Exceptions 

none 



Fig. 34C (cont'd) 



G.C0M.AND.E.8 


Group compare and equal zero bytes 


G.C0M.AND.E.16 


Group compare and equal zero doublets 


G.COM.AND.E.32 


Group compare and equal zero quadlets 


G.COM.AND.E.64 


Group compare and equal zero octlets 


G.COM.AND.E.128 


Group compare and equal zero hexlet 


G.C0M.AND.NE.8 


Group compare and not equal zero bytes 


G.C0M.AND.NE.1 6 


Group compare and not equal zero doublets 


G.COM.AND.NE.32 


Group compare and not equal zero quadlets 


G.COM.AND.NE.64 


Group compare and not equal zero octlets 


G.COM.AND.NE.128 


Group compare and not equal zero hexlet 


G.C0M.E.8 


Group compare equal bytes 


G.C0M.E.16 


Group compare equal doublets 


G.COM.E.32 


Group compare equal quadlets 


G.COM.E.64 


Group compare equal octlets 


G.COM.E.128 


Group compare equal hexlet 


G.C0M.GE.8 


Group compare greater equal signed bytes 


G.C0M.GE.16 


Group compare greater equal signed doublets 


G.COM.GE.32 


Group compare greater equal signed quadlets 


G.COM.GE.64 


Group compare greater equal signed octlets 


G.COM.GE.128 


Group compare greater equal signed hexlet 


G.C0M.GE.U.8 


Group compare greater equal unsigned bytes 


G.C0M.GE.U.16 


Group compare greater equal unsigned doublets 


G.COM.GE.U.32 


Group compare greater equal unsigned quadlets 


G.COM.GE.U.64 


Group compare greater equal unsigned octlets 


G.COM.GE.U.128 


Group compare greater equal unsigned hexlet 


G.C0M.L.8 


Group compare signed less bytes 


G.C0M.L.16 


Group compare signed less doublets 


G.COM.L.32 


Group compare signed less quadlets 


G.COM.L64 


Group compare signed less octlets 


G.COM.L128 


Group compare signed less hexlet 


G.C0M.LU.8 


Group compare less unsigned bytes 


G.C0M.LU.16 


Group compare less unsigned doublets 


G.COM.L.U.32 


Group compare less unsigned quadlets 


G.COM.LU.64 


Group compare less unsigned octlets 


G.COM.LU.128 


Group compare less unsigned hexlet 


G.C0M.NE.8 


Group compare not equal bytes 


G.C0M.NE.16 


Group compare not equal doublets 


G.COM.NE.32 


Group compare not equal quadlets 


G.COM.NE.64 


Group compare not equal octlets 


G.COM.NE.128 


Group compare not equal hexlet 



Fig. 35A 



Format 



G.COM.op.size rd.rc 
G.COM.opz.size red 

gcomopsize(rd.rc) 

31 24 23 18 17 12 11 6 5 0 

I G.size | rd | rc | op | GCOM I 

8 6 6 6 6 



Fig. 35B 



D finition 

def GroupComparefop.size.rd^c) 
d <- RegRead(rd, 128) 
c «- RegRead(rc, 128) 
case op of 

G.COM.E: 

for i <— 0 to 128-size by size 

a|+size-1..i <- (di+size-1..i = q+size-1..i) size 
endfor 
G.COM.NE: 

for i <- 0 to 1 28-size by size 

ai+size-1..i <- (dj+size-U * Cj +S ize-1..i) s,ze 
endfor 
G.COM.AND.E: 

for i <- 0 to 1 28-size by size 

ai+size-1..i «- ((q+size-1..i and dj+ S j ze -i j) = 0) slze 
endfor 
G.COM.AND.NE: 

for i <- 0 to 1 28-size by size 

aj+size-1..i <- ((q+size-1..i and dj +S ize-U) * 0) size 
endfor 
G.COM.L: 

for i <- 0 to 128-size by size 

ai+size-1..l <- ((rd = rc) ? (Ci +S j ze -i..j < 0) : (dj +s j ze _i..j < Cj+ske-u)) 8 ' 26 
endfor 
G.COM.GE: 

for i <- 0 to 128-size by size 

aj+size-1..i <- ((rd = rc) ? (Cj +S j ze -1..i ^ 0) : (dj +S i ze -1J ^ c i+S j Z e-1j)) size 
endfor 
G.COM.L.U: 

for i «- 0 to 1 28-size by size 

ai+size-1..i <- ((rd = rc) ? (c i+S j ze .i..i > 0) : 
((0 ||d +S j ze .i..i)<(0 ||Ci +siZ e-i..i))) size 

endfor 
G.COM.GE.U: 

for i <- 0 to 1 28-size by size 

ai+size-1 J <- ((rd = rc) ? (Cj +S ize-1J ^ 0) : 
((0 || d i+S ize-1 ..i) * (0 II q +S ize-1..i))) sj2e 

endfor 

endcase 
if (a * 0) then 

raise FixejJPointArithmetic 

end if 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 35C 



E.L0G.M0ST.8 


Ensemble log of most significant bit signed bytes 


E.L0G.M0ST.16 


Ensemble log of most significant bit signed doublets 


E.LOG.MOST.32 


Ensemble log of most significant bit signed quadlets 


E.LOG.MOST.64 


Ensemble log of most significant bit signed octlets 


E.LOG.MOST.128 


Ensemble log of most significant bit signed hexlet 


E.L0G.M0ST.U.8 


Ensemble log of most significant bit unsigned bytes 


E.L0G.M0ST.U.16 


Ensemble log of most significant bit unsigned doublets 


E.LOG.MOST.U.32 


Ensemble log of most significant bit unsigned quadlets 


E.LOG.MOST.U.64 


Ensemble log of most significant bit unsigned octlets 


E.LOG.MOST.U.128 


Ensemble log of most significant bit unsigned hexlet 
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Selection 



class 


op 


size 


sum 


SUM 


8 16 32 64 


SUM.U 


1 8 16 32 64 


log most 
significant bit 


LOG.MOST LOG.MOST.U 


8 16 32 64 128 
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Format 

E.op.size rd=rc 
rd=eopsize(rc) 

31 24 23 18 17 12 11 6 5 0 

I E.size | rd | rc | op | E.UNARY | 

8 6 6 6 6 
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Definition 



def EnsembleUnary(op,size,rd,rc) 
c RegRead(rc, 128) 
cas op of 

E.LOG.MOST: 

for i <- 0 to 128-size by size 
'f(ci+size-1..i=0)then 

ai+slze-1..i<--1 

else 

for j <- 0 to size-1 

if Csize-1+j. j+| = (c%\jg]i\ II not c size-1+l) th ^n 
ai+size-1..i<-j 

endif 
endfor 

endif 
endfor 
E.LOG.MOSTU: 

for i «- 0 to 128-size by size 

^(Ci+size-U^OJthen 

aj+size-1..i<--1 

else 

for j <- 0 to size-1 

ifc S ize-1 + i..H = (0 size ' 1 -i||1)then 

ai+size-1..i<-j 

endif 
endfor 

endif 
endfor 
E.SUM: 

p[ 0]<-o 1 28 

for i <- 0 to 128-size by size 

p[i+size] <- p[i] + (c^ize || c S ize-1+Li) 
endfor 
a<-p[128] 
E.SUMU: 

p[0]<-0 128 

for i <- 0 to 128-size by size 

p[i+size] <- p[i] + (0^8-size || c size .i +U ) 
endfor 
a«-p[128] 

endcase 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 
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Floating-point function Definitions 

defetx- bits(prec)as 
cas prefof 
16: 

eb<-5 

32: 

eb*-8 

64: 

eb*-11 

128: 

eb4-15 

endcase 
enddef 

def eb <- ebias(prec) as 

eb<-0||1 ebits (P rec M 
enddef 

def fb <- fbits(prec) as 
fb <- prec - 1 - eb 
nddef 

def a <- F(prec, ai) as 
a.s «- aip r ec-l 
ae <- aip r ec-2..fbits(prec) 

af<-aifbits(prec)-1..0 
jfae=:1 ebits(prec) then 

if af = 0 then 

a.t <- INFINITY 
elseif affbits(prec)-1 1* 160 

a.t <- SNaN 

a.e 4- -fblts(prec) 

a.f<- 1 || affbits(prec)-2..0 

else 

a.t <- QNaN 
a.e -fbits(prec) 
a.f <- af 

endif 
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els ifae = Othen 
tf af = Othen 

a.t*- ZERO 

else 

a.t «- NORM 

a.e <- 1-ebias(prec)-fbits(prec) 
a.f<-0||af 

endif 

else 

a.t <- NORM 

a.e <- ae-ebias(prec)-fbits(prec) 
a.f<-1 || af 

endif 
enddef 

def a <- DEFAULTQNAN as 

a.s<-0 

a.t <- QNAN 

a.e <- -1 

a.f<-1 
enddef 

def a <- DEFAULTSNAN a$ 

a.s «- 0 

a.t <- SNAN 

a.e <- -1 

a.f<-1 
enddef 

def fadd(a,b) as faddr(a,b,N) enddef 

def c <- faddr(a,b,round) as 

if a.t=NORM and b.t=NORM then 

// d,e are a,b with exponent aligned and fraction adjusted 
if a.e > b.e then 
d«-a 
e.t<-b.t 
e.s <- b.s 
e.e <- a.e 

e.f<-b.f || 0 ae - be 
else if a.e < b.e then 
d.t <- a.t 
d.s «- a.s 
d.e <- b.e 

d.f<- a .f || 0 be - ae 
e<-b 

endif 
c.t <- d.t 

c.e <- d.e 

if d.s = e.s then 

c.s d.s 

c.f <- d.f + e.f 
elseifd.f >e.f then 

c.s <- d.s 

c.f <- d.f - e.f 
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elsetf d.f < e.f then 
c.s <- .s 
c.f<-e.f-d.f 

else 

c.s <- r=F 
c.t«-ZERO 

endif 

// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 
c<- b 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c^-a 

elseif a.t=ZERO and b.t=ZERO then 
at «- ZERO 

c.s <- (a.s and b.s) or (round=F and (a.s or b.s)) 
// NULL values are like zero, but do not combine with ZERO to alter sign 
elseif a.t=ZERO or a.t=NULL then 

c <- b 

elseif b.t=ZERO or b.t=NULL then 
c < a 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c <- DEFAULTSNAN // Invalid 

else 

c <- a 

endif 

elseif a.t=INFINITY then 
c 4 a 

elseif b.t=INFINITY then 
c <- b 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def b <- fneg(a) as 

b.s <- -a.s 

b.t «- a.t 

b.e <- a.e 

b.f <- a.f 
enddef 

def fsub(a.b) as fsubr(a,b,N) enddef 

def fsubr(a,b,round) as faddr(a,fneg(b),round) enddef 

def frsub(a,b) as frsubr(a,b,N) enddef 

def frsubr(a,b,round) as faddr(fheg(a),b,round) enddef 

def c <r- fcom(a.b) as 

if (a.t=SNAN) or (a.t=QNAN) or (b.t=SNAN) or (b.t=QNAN) then 
c<- U 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c «- (a.s=0) ? G: L 
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else 

c«-E 

endif 

elseif a.t=INFINITY then 

c <- (a.s=0) ? G: L 
elseif b.t=INFINITY then 

c <- (b.s=0) ? G: L 
elseif a.t=NORM and b.t=NORM then 

if a.s * b.s then 

c 4- (a.s=0) ? G: L 

else 

if a.e > b.e then 
af <- a.f 

bf*-b.f||O ae - be 

else 

af <-a.f ||O be - ao 
bf«-b.f 

endif 

if af = bf then 
c <- E 

else 

c<-((a.s=0) A (af>bf))?G:L 

endif 

endif 

elseif a.t=NORM then 

c «- (a.s=0) ? G: L 
elseif b.t=NORM then 

c<-(b.s=0)?G:L 
elseif a.t=ZERO and b.t=ZERO then 
c*-E 

else 

assert FALSE // should have covered at the cases above 

endif 
enddef 

def C4-fmul(a,b) as 

if a.t=NORM and b.t=NORM then 

c.s <- a.s A b.s 

c.t <- NORM 

c.e «- a.e + b.e 

c.f<-a.f* b.f 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s <- a.s A b.s 

c.t <- b.t 

c.e <- b.e 

c.f<-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s <- a.s A b.s 
c.t<-a.t — * 
c.e 4- a.e 
c.f <- a.f 

elseif a.t=ZERO and b.t=INFINITY then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=ZERO then 

c *- DEFAULTSNAN // Invalid 
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Iseif a.t=ZERO or b.t=ZERO then 
c.s «- a.s A b.s 
at <- ZERO 

else 

assert FALSE // should have covered al the cases abov 

endif 
enddef 

def c <- fdivr(a t b) as 

if a.t=NORM and b.t=NORM then 
c.s <- a.s A b.s 
c.t <- NORM 
c.e <- a.e - b.e + 256 

c.f<-(a.f II 0 256 )/b.f 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s <- a.s A b.s 

c.t <- b.t 

c.e «- b.e 

c.f<-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s <- a.s A b.s 
c.t <- a.t 
c.e <- a.e 
c.f <- a.f 

elseif a.t=ZERO and b.t=ZERO then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=INFINITY then 

c «- DEFAULTSNAN // Invalid 
elseif a.t=ZERO then 

c.s <- a.s A b.s 

c.t <- ZERO 
elseif a.t=INFINITY then 

c.s <- a.s A b.s 

c.t <- INFINITY 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def msb <- findmsb(a) as 

MAXF 2 1 8 // Largest possible f value after matrix multiply 
forj<-OtoMAXF 

if aMAXF-1 ..j = (oM^-H || 1 ) then 
msb<-j 

endif 
endfor 
enddef 

def ai <- PackF(prec,a,round) as 
case a.t of 
NORM: 

msb <- findmsb(a.f) 

rn <- msb-l-fbits(prec) // Isb for normal 

rdn -ebias(prec)-a.e-1-fbits(prec) // Isb if a denormal 

rb <- (rn > rdn) ? rn : rdn 
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if rb £ 0 then 

aifr<-a.f ms b-1..0 II 0"* 
eadj <- 0 

else 

case round of 
C: 

s <- Q™$b-rt> || (-a.s)* 

F: 

s <- 0™**-* || (a.s)* 
N, NONE: 

s ^ 0 msb.rb ( | _ afrb || af rg-1 

X: 

if a.frt>-i ..o * 0 then 

raise FloatingPointArithmetic // Inexact 

endif 
s<-0 

Z: 

s<-0 

endcase 

v^(0||a.f ms b..0) + (0||s) 
ifv msb= 1 then 

aifr^-vmsb-L.rt) 

eadj <- 0 

else 

aifr^O^Mprec) 
eadj <- 1 

endif 

endif 

aien <- a.e + msb - 1 + eadj + ebias(prec) 
if aien s 0 then 

if round = NONE then 

ai <- a.s || o ebits (P rec ) || aifr 

else 

raise FloatingPointArithmetic //Underflow 

endif 

elseif aien ;> iebits(prec) then 
if round = NONE then 

//default: round-to-nearest overflow handling 
ai <- a.s || lebits(prec) ( | 0 fbits(prec) 

else 

raise FloatingPointArithmetic //Underflow 

endif 

else 

ai <- a.s || aien e bjts(prec)-1..0 II a jfr 

endif 
SNAN: 

if roumt * NONE then 

raise FloatingPointArithmetic //Invalid 

endif 

if -a.e < fbits(prec) then 

ai <- a.s || l©bits(prec) |j a .f_ a . e -1..0 II 0 fbits <P rec ) +a e 
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else 

Isb 4- a.f. a .e-1-fbits(prec)+1..0 * 0 

ai <- a.s || iebits(prec) ,| a.f. a .e-1...a.e.1.fbits(prec)+2 II Isb 

endif 
QNAN: 

if -a.e < fbits(prec) then 

ai 4- a.s || i©bits(prec) || a.f. a .e-i..o II O^'* 5 ^ 60 ^ 3 * 6 

else 

Isb 4- a.f_ a .e-i-fbits(prec)+1..0 * 0 

ai 4- a.s || lebits(prec) g a.f- a .e-1..-a.e-1-fbits{prec>+2 II Isb 

endif 
ZERO: 

ai <- a.s || o ebits (P rec ) || o^ts^ 60 ) 
INFINITY: 

ai 4- a.s || lebits(prec) |j 0 fbits(prec) 

endcase 
defdef 

def ai <- fsinkr(prec, a, round) as 
case a.t of 
NORM: 

msb 4- findmsb(a.f) 
rb <- -a.e 
if rb <, 0 then 

aifr^a.f ms b..Ol|0" rb 
aims 4- msb - rb 

else 

case round of 
C, CD: 

s <- o msb - rb || (-aLs)* 
F, F.D: 

s 4- Q™sb-*> || (ai.s)* 
N, NONE: 

s 4- omsb-rb || -ai.ffb || ai.f^ 1 

X: 

if ai.frb-1 ..o*0 then 

raise FloatingPointArithmetic // Inexact 

endif 
s 4- 0 
Z, Z.D: 

S 4- 0 

endcase 

V4-(0||a.f msb ..o) + (0||s) 
' f v msb = 1 then 

aims 4- msb + 1 - rb 

else 

, aims 4- msb - rb 

endif 

aifr 4- v a jms..rb 

endif 

if aims > prec then 
case round of 

CD, F.D, NONE, Z.D: 

ai 4- a.s || (-as)P rec - 1 
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C, F, N, X, Z: 

raise FloatingPointArithmetic // Overflow 

endcase 
elseif a.s = 0 then 
ai «- aifr 

else 

ai <- -aifr 

endif 
ZERO: 

ai <- oP rec 
SNAN, QNAN: 

case round of 

CD, F.D, NONE, Z.D: 

ai <- oPrec 
C, F, N, X, Z: 

raise FloatingPointArithmetic // Invalid 

endcase 
INFINITY: 

case round of 

CD, F.D, NONE, Z.D: 

ai <- a.s || (~as)P rec " 1 
C, F, N, X, Z: 

raise FloatingPointArithmetic // Invalid 

endcase 

endcase 
enddef 



def c <- frecrest(a) as 
b.s <- 0 
b.t <- NORM 
b.e <- 0 
b.f<-1 

c <- fest(fdiv(b,a)) 
enddef 

def c <- frsqrest(a) as 
b.s<-0 
b.t <- NORM 
b.e <- 0 
b.f<-1 

c <- fest(fsqr(fdiv(b,a))) 
enddef 

def c <- fest(a) as 

if (a.t=NORM) then 

msb <- findmsb(a.O 
a.e <~ a.e + msb- 13 

a.f<-a.f ms b..msb-12ll 1 

else 

c«-a 

endif 
enddef 

def c <- fsqr(a) as 

if (a.t=NORM) and (a.s=0) then 
c.s«-0 
c.t <- NORM 
if (a.eo = 1)then 
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c.e<-(a.e-127)/2 
c.f<-sqr(a.f ||0 127 ) 

else 

c.e4-(a.e-128)/2 
c.f*-sqr(a.f ||0 128 ) 

endif 

elself (a.t=SNAN) or (a.t=QNAIM) or a.t=ZERO or ((a.t=INFINITY) and (a.s=0)) then 
c < a 

elseif ((a.t=NORM) or (a.t=INFINITY)) and (a.s=1) then 
c <- DEFAULTSNAN // Invalid 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

Fig. 37 (cont'd) 
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Pncomhlo mi iltinlv/ floatino-ooint cinolo ooilino 

ciiociiiuic inutupiy MUdiiiiy-puiiii oinyic uoiiifiy 


C Ml II P 19 P 
t.MULr.o^.r 


Cncomhlo mi iltinlv/ flnotinn_n^int cinolo floor 

cnsGmuie muiupiy iiudiiny-puiiu binyit? nuur 


P Ml II P 19 M 
t.lVIUL.r.oZ.IN 


Pncomhlo mi iltinlv/ floatino-ooint cinolo no a roc t 
CFlbclTlUIti MlUIUpiy HUdlll iy~puil 11 oil iy 1c lltJdlcOl 


P Ml II P 19 Y 


Pncomhlo mi iltinlv/ floatino-ooint cinolo ova of 

ciiotJinuitJ inuiupiy iiuduiiy-puuii oinyic t?Adui 


P Ml II P 19 "7 


Pncomhlo mi iltinlv/ floatino-noint cinolo 70m 

cno6niui6 rnuiupiy iiudin ly-puiiu binyic t&w 


P Ml II P f\A 


Pncomhlo mi iltinlv/ floatino.ooint Hoi ihlo 
cubciiiuitJ inuiupiy iiudiii iy*puii 11 uuuuit; 


P Ml II P f\A P 


Pncomhlo mi iltinlv/ floatino.noint Hoi ihlo ooilino 

cnotJiiiuit? muiupiy uuduriy^puiiu uuuuic ociuiiy 


P Ml II P ftA P 


Pncomhlo mi iltinlv/ flootino.ooint Hoi ihlo floor 

criocmijit? muiupiy iiuauiiy*puini uuuuic uuui 


P Ml II P RA M 
£ . IVI U L . r . D *t . IN 


Pncomhlo mi iltinlv/ floatino-ooint Hoi ihlo nosroct 
ciibtJiiiuit; rnuiupiy iiuduiiy-puiiu uuuuic? ncdicsoi 


P ivyii II P ftA Y 
C.MUL.r.DH.A 


Pncomhlo mi iltinlv/ floatino-noint Hoi ihlo ovaot 
ciiocinuic iTiuiupiy uudiiny-puiiu uuuuic t?Adui 


C KA\ II P ft/I "7 


CncomhlA mi iltinlw fl^otin/i n^int Hai ihlo 70m 

crioemuie muiupiy Tiuauny-puini uuuuic z.ciu 


cr Ml 11 C 1 OQ 

t.MUL.r. i^o 


Cncamhlo mi iltinlv/ flnotinn_ nnint m 10H 

cnsemDie muiupiy Tiuauny-poini quaa 


E MUL F 128 C 


Ensemble multiolv floatina-ooint Quad ceilina 


E.MULF.128.F 


Ensemble multiply floating-point quad floor 


E.MULF.128.N 


Ensemble multiply floating-point quad nearest 


E.MULF.12SX 


Ensemble multiply floating-point quad exact 


E.MUL.F.128.Z 


Ensemble multiply floating-point quad zero 



Fig. 38A (cont'd) 



Selection 



class 


op 


prec 


round/trap 


add 


EADDF 


16 32 64 128 


NONE C F N X Z 


divide 


EDIVF 


16 32 64 128 


NONE C F N X Z 


multiply 


EMULF 


16 32 64 128 


NONE C F N X Z 


complex multiply 


EMUL.C 
F 


16 32 64 


NONE 



Format 

E.op.prec.round rd=rc,rb 
rd=eopprecround(rc,rb) 

31 24 23 18 17 12 11 65 0 

I E.prec | rd I rc | rb I op.round | 

8 6 6 6 6 



Fig. 38B 



Definition 

def mul(size f v,i t wj) as 

mul <- fmul(F(size,v S j Ze -i +u),F(size,w S j Z e-1 +j. j)) 
enddef 

def EnsembleFloatingPoint(op,prec,round,ra f rb,rc) as 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i <- 0 to 1 28-prec by prec 
ci<-F(prec f Ci +P rec-1.j) 

bi4-F(prec f bi +P rec-1..i) 
case op of 

E.ADD.F: 

ai <- faddr(ci,bi,round) 
E.MULF: 

ai <- fmul(ci,bi) 
E.MULC.F: 

if (i and prec) then 

ai <- faddfmuKprec.cj.b.i-prec), mul(prec,c,i-prec t b,i)) 

else 

ai <- fsubfmuKprec.cJ.bJ), muKprecci+prec.b.i+prec)) 

endif 
E.DIV.F.: 

ai <- fdiv(ci.bi) 

endcase 

ai+prec-1..i «- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 38C 



Operation codes 



E.MULADD.C.F.16 


Ensemble multiply add complex floating-point half 


E.MULADD.C.F.32 


Ensemble multiply add complex floating-point single 


E.MUL.ADD.C.F.64 


Ensemble multiply add complex floating-point double 


E.MULADD.F.16 


Ensemble multiply add floating-point half 


E.MUL.ADD.F.16.C 


Ensemble multiply add floating-point half ceiling ! 


E.MULADD.F.16.F 


Ensemble multiply add floating-point half floor 


E.MULADD.F.16.N 


Ensemble multiply add floating-point half nearest 


E.MULADD.F.16.X 


Ensemble multiply add floating-point half exact 


E.MULADD.F.16.Z 


Ensemble multiply add floating-point half zero 


E.MUL.ADD.F.32 


Ensemble multiply add floating-point single 


E.MULADD.F.32.C 


Ensemble multiply add floating-point single ceiling 


E.MULADD.F.32.F 


Ensemble multiply add floating-point single floor 


E.MUL.ADD.F.32.N 


Ensemble multiply add floating-point single nearest 


E.MULADD.F.32.X 


Ensemble multiply add floating-point single exact 


E.MUL.ADD.F.32.Z 


Ensemble multiply add floating-point single zero 


E.MULADD.F.64 


Ensemble multiply add floating-point double 


E.MULADD.F.64.C 


Ensemble multiply add floating-point double ceiling 


E.MULADD.F.64.F 


Ensemble multiply add floating-point double floor 


E.MUL.ADD.F.64.N 


Ensemble multiply add floating-point double nearest 


E.MULADD.F.64.X 


Ensemble multiply add floating-point double exact 


E.MUL.ADD.F.64.Z 


Ensemble multiply add floating-point double zero 


E.MULADD.F.128 


Ensemble multiply add floating-point quad 


E.MULADD.F.128.C 


Ensemble multiply add floating-point quad ceiling 


E.MULADD.F.128. F 


Ensemble multiply add floating-point quad floor 


E.MULADD.F.128. N 


Ensemble multiply add floating-point quad nearest 


E.MUL.ADD.F. 128.X 


Ensemble multiply add floating-point quad exact 


E.MULADD.F.128.Z 


Ensemble multiply add floating-point quad zero 


E.MUL.SUB.C.F.16 


Ensemble multiply subtract complex floating-point half 


E.MULSUB.C.F.32 


Ensemble multiply subtract complex floating-point single 


E.MULSUB.C.F.64 


Ensemble multiply subtract complex floating-point double 


E.MUL.SUB.F.16 


Ensemble multiply subtract floating-point half 


E.MUL.SUB.F.32 


Ensemble multiply subtract floating-point single 


E.MUL.SUB.F.64 


Ensemble multiply subtract floating-point double 


E.MUL.SUB.F.128 


Ensemble multiply subtract floating-point quad 



Fig. 38D 



Selection 



class 


op 


type 


prec 


round/trap 


multiply add 


E.MUL.AD 
D 


F 


16 32 64 128 


NONE C F N X Z 


C.F 


16 32 64 


NONE 


multiply subtract 


E.MULSU 
B 


F 


16 32 64 128 


NONE 


C.F 


16 32 64 


NONE 



Format 



E.op.size rd@rc,rb 
rd=eopsize(rd,rc,rb) 

31 24 23 18 17 12 11 6_5 0_ 

| E.size | rd | rc I rb | op | 

8 6 6 6 6 

Fig. 38E 



Definition 

def mul(size,v,i,w,j) as 

mul <- fmul(F(size f v S i Z e-i+i.,i),F(size f w S i ze .i+j..j)) 
enddef 

def EnsemblelnplaceFloatingPoint(op,size,rd,rc,rb) as 
d «- RegRead(rd, 128) 
c «- RegRead(rc t 128) 
b RegRead(rb, 128) 
for i *- 0 to 128-size by size 
di<-F(prec ( d l+ prec-1..i) 
case op of 

E.MULADD.F: 

ai <- fadd(di, mul(prec f c,i,b,i)) 
E.MULADD.C.F: 

if (i and prec) then 

ai <- fadd(di, fadd(mul(prec,c,i,b,i-prec), mul(c,i-prec,b f i))) 

else 

ai <- fadd(di, fsub(mul(prec,c,i,b,i) f mul(prec,c,i+prec,b,i+prec))) 

endif 
E.MULSUB.F: 

ai <- frsub(di, mul(prec,c,i,b,i)) 
E.MULSUB.C.F: 

if (i and prec) then 

ai <- frsub(di f fadd(mu!(prec I c f i,b,i-prec) l mul(c,i-prec,b,i))) 

else 

ai <r- frsub(di, fsub(mul(prec,c,i f b,i), mul(prec,cj+prec,b,i+prec))) 

endif 

endcase 

aj+prec-1 ..i <- PackF(prec f ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 

Fig. 38F 



Operation codes 



E.SCAL.ADD.F.16 


Ensemble scale add floating-point half 


E.SCAL.ADD.F.32 


Ensemble scale add floating-point single 


E.SCAL.ADD.F.64 


Ensemble scale add floating-point double 



Fig. 38G 



Sel cti n 



class 


op 


prec 


scale add 


E.SCAL.ADD.F 


16 32 64 



Format 



E.SCAL.ADD.F.size ra=rd,rc,rb 
ra=escaladdfsize(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I op I rd | rc | rb | ra | 

8 6 6 6 6 



Fig. 38H 



D finiti n 



def EnsembleFloatingPointTernarytop.prec.rd.rcrb.ra) as 
d<-RegR ad(rdJ28) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i 4- 0 to 1 28-prec by prec - 

di^-FCprecdi+prec-l.j) 

ci<~F(prec l Cj +P rec-1..i) 

ai <r- fadd(fhnul(di, F(prec,b pre c-l..o)). fmul(ci, F(prec,b2»prec-1..prec))) 
ai+prec-1..i «- PackF(prec, ai f none) 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 



Fig. 381 



E.SUB.F.16 


Ensemble subtract floating-point half 


E.SUB.F.16.C 


Ensemble subtract floating-point half ceiling 


E.SUB.F.16.F 


Ensemble subtract floating-point half floor 


E.SUB.F.16.N 


Ensemble subtract floating-point half nearest 


E.SUB.F.16.Z 


Ensemble subtract floating-point half zero 


E.SUB.F.16.X 


Ensemble subtract floating-point half exact 


E.SUB.F.32 


Ensemble subtract floating-point single 


E.SUB.F.32.C 


Ensemble subtract floating-point single ceiling 


E.SUB.F.32.F 


Ensemble subtract floating-point single floor 


E.SUB.F.32.N 


Ensemble subtract floating-point single nearest 


E.SUB.F.32.Z 


Ensemble subtract floating-point single zero 


E.SUB.F.32.X 


Ensemble subtract floating-point single exact 


E.SUB.F.64 


Ensemble subtract floating-point double 


E.SUB.F.64.C 


Ensemble subtract floating-point double ceiling 


E.SUB.F.64.F 


Ensemble subtract floating-point double floor 


E.SUB.F.64.N 


Ensemble subtract floating-point double nearest 


E.SUB.F.64.Z 


Ensemble subtract floating-point double zero 


E.SUB.F.64.X 


Ensemble subtract floating-point double exact 


E.SUB.F.128 


Ensemble subtract floating-point quad 


E.SUB.F.128.C 


Ensemble subtract floating-point quad ceiling 


E.SUB.F.128.F 


Ensemble subtract floating-point quad floor 


E.SUB.F.128.N 


Ensemble subtract floating-point quad nearest 


E.SUB.F.128.Z 


Ensemble subtract floating-point quad zero 


E.SUB.F.128.X 


Ensemble subtract floating-point quad exact 



Fig. 39A 



Selection 



class 


PR 


_prec 


round/trap 


set 


SET. 
E LG 
L GE 


16 32 64 128 


NONE X 


subtract 


SUB 


16 32 64 128 


NONE C F N X Z 



Format 

E.op.prec.round rd=rb,rc 
rd=eopprecround(rb,rc) 

31 24 23 18 17 12 11 65 0 

I E.prec I rd | rc | rb I op.round | 

8 6 6 6 6 



Fig. 39B 



Definition 



def EnsembleReversedFloatingPoint(op,prec f round f rcl,rc f rb) 
c <- RegRead(rc, 128) 
b +- RegRead(rb, 128) 
for i 0 to 128-prec by pr c 

ci<~F(prec > Cj +pr ec-i..j) 

bi<-F(prec f bi +pr ec-l.j) 

ai <- frsubr(ci,-bi, round) 

ai+prec-1..i <- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 39C 



Operati n codes 



G.SET.E.F.Io 


oroup sei equal noaung-poini naii 


O OCX C C 4 C V 

G.oET.E.r.lb.X 


oroup set equal noaung-poini naii exact 


OCT C C OO 

G.SET.E.F.32 


oroup sei equal Tioaung-poini single 


O OCT C C OO V 

G.SET.E.F.32.X 


oroup sei equal noaung-poini single exact 


j-\ OCT C C C4 

G.SET.E.F.64 


oroup set equal iioaung-point aouoie 


OCT F F fiil V 

G.SET.E.F.64.X 


oroup sei equal noaung-point oouuie exact 


/> OCT C C 4 OO 

G.5ET.E.F.128 


oroup set equal iioaung-point quae 


/"% OCT C C 4 OO \/ 

G.SET.E.F.128.X 


oroup set equal iioaung-point quae exact 


/** O CT ^"*C C 4 £S V 

G.oE I .Gb.r.lo.A 


oroup set greater equal noaung-poini nan exact 


/-* OCT /"»C C OO V 

G.SET.GE.F.32.X 


oroup set greater equal noaung-point single exact 


/■> OCT f*C C C 4 V 

G.5ET.GE.F.64.X 


oroup set greater equal noaung-point aouDie exact 


/■> OCT /"*C FT 4 OO V 

G.SET.GE.r. 128.X 


Group set greater equal floating-point quad exact 


^ O CT 1 f+ C 4 C 

G.SET.LG.F.16 


oroup set less greater noaung-poini naii 


O CT 1 P C V 

G.SET.LG.F.16.X 


oroup sei less greater noaung-poini naii exact 


/"* oct i c oo 
G.SET.LG.F.32 


oroup set less greater noating-point smgie 


OCT 1 C OO V 

G.5ET.LG.F.32.X 


oroup set less greater iioaung-point smgie exact 


OCT 1 ^ F" 4 

G.SET.LG.F.64 


r^^Al ■ A **A^ Ia\AA /VPAA^AP tlAAflAA ma! A^ iUIa 

oroup set less greater floating-point aouoie 


^ OCT 1 FT 0 4 \/ 

G.SET.LG.F.64.X 


Group set less greater floating-point double exact 


OCT 1 f> F" 4 OO 

G.SET.LG.F.128 


Group set less greater floating-point quad 


O OFTT 1 r~ 400 \/ 

G.SET.LG.F. 128.X 


Group set less greater floating-point quad exact 


/*> OCT 1 C 4^ 

G.SET.L.F.16 


oroup set less tioaung-point naii 


/•"% OCT 1 C <IC V 

G.SET.L.F.16.X 


w m0\ t i A oa^ lAf*r% flAAfiAA AAtr^^ WaIt av^aa^ 

oroup set less floating-point nai? exact 


/-> OCT 1 C OO 

G.SET.L.F.32 


oroup set less noating-point smgie 


OFT i f* oo \/ 

G.SET.L.F.32.X 


Group set less floating-point single exact 


CI OCT 1 C fij, 


Grouo set less floatinn-noint double 


G.SET.L.F.64.X 


Group set less floating-point double exact 


G.SET.LF.128 


Group set less floating-point quad 


G.SET.L.F.128.X 


Group set less floating-point quad exact 


G.SET.GE.F.16 


Group set greater equal floating-point half 


G.SET.GE.F.32 


Group set greater equal floating-point single 


G.SET.GE.F.64 


Group set greater equal floating-point double 


G.SET.GE.F.128 


Group set greater equal floating-point quad \ 



Fig. 39D 



Equival ncies 



G.SET.LE.F.16.X 


Group set less equal floating-point half exact 


G.SET.LE.F.32.X 


Group set less equal floating-point single exact 


G.SET.LE.F.64.X 


Group set less equal floating-point double exact 


G.SET.LE.F.128.X 


Group set less equal floating-point quad exact 


G.SET.G.F.16 


Group set greater floating-point half 


G.SET.G.F.16.X 


Group set greater floating-point half exact 


G.SET.G.F.32 


Group set greater floating-point single \ 


G.SET.G.F.32.X 


Group set greater floating-point single exact 


G.SET.G.F.64 


Group set greater floating-point double 


G.SET.G.F.64.X 


Group set greater floating-point double exact 


G.SET.G.F.128 


Group set greater floating-point quad 


G.SET.G.F.128.X 


Group set greater floating-point quad exact 


G.SET.LE.F.16 


Group set less equal floating-point half 


G.SET.LE.F.32 


Group set less equal floating-point single 


G.SET.LE.F.64 


Group set less equal floating-point double 


G.SET.LE.F.128 


Group set less equal floating-point quad 



G.SET.G.F.prec rd=rb,rc 


-» G.SET.L.F.prec rd=rc,rb 


G.SET. G.F.precX rd-rb,rc 


-» G.SET.LF.preaX rd=rc,rb 


G.SET.LE.F.prec rd=rb,rc 


-+ G.SET.GE.F.prec rd=rc,rb 


G.SET.LE.F.precX rd-rb,rc 


-> G.SET.GE.F.preaX rd=rc,rb 



Fig. 39E 



Selection 



class 


op 


prec 


round/trap 


set 


SET. 
E LG 
L GE 
G LE 


16 32 64 128 


NONE X 



Format 



G.op.prec.round rd=rb,rc 
rc=gopprecround(rb,ra) 

31 24 23 18 17 12 11 6 5 0 

I G.prec I rd | rc I rb | op.round I 

8 6 6 6 6 



Fig 39F 



Definition 



def GroupFloatingPointReversedCop.prec.round^d.rc.rb) as 
c^-RegR ad(rc, 128) 
b <- RegRead(rb, 128) 
for i <- 0 to 128-prec by pr c 
ci<-F(pr c,Ci + p r ec-l.j) 
bi^Ffprec.bj+prec-i.j) 
if round*NONE then 

if (di.t = SNAN) or (ci.t = SNAN) then 
raise FloatingPointArithmetic 

endif 

case op of 

G.SET.LF, G.SET.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.SET.LF: 

ai <- bi?>ci 
G.SET.GE.F: 

ai <- bi!?<ci 
G.SET.E.F: 

ai <~ bi=ci 
G.SET.LG.F: 

ai <r- bi*ci 

endcase 

ai+prec-1..i«-aiP rec 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 



Floating-point arithmetic 



Fig. 39G 



G COM E F 16 


Group compare equal floating-point half 


G COM E F 16 X 

W.VSV./IVI,L..I • I v.A 


Group compare equal floating-point half exact 


G COM E F 32 


Group compare equal floating-point singl 


G COM E F 32 X 


Group compare equal floating-point single exact 


G COM E F 64 


Group compare equal floating-point double 


G COM F F 64 X 


Group compare equal floating-point double exact 


G COM F F 128 


Group compare equal floating-point quad 


G COM E F 128 X 


Group compare equal floating-point quad exact 


G COM GE F 16 


Group compare greater or equal floating-point half 


G COM GE F 16 X 

vjp.v/vyivi .vju! f • iw.A 


Group compare greater or equal floating-point half exact 


G COM GE F 32 


Group compare greater or equal floating-point single 


G COM GE F 32 X 


Group compare greater or equal floating-point single exact 


G COM GE F 64 


Group compare greater or equal floating-point double 


G COM GE F 64 X 


Group compare greater or equal floating-point double exact 


G COM GE F 128 


Group compare greater or equal floating-point quad 


G COM GE F 128 X 


Group compare greater or equal floating-point quad exact 


G COM L F 16 


Group compare less floating-point half 


G COM L F 16 X 

\J . VsVm/IVI .L.I ■ 1 V/iA 


Group compare less floating-point half exact 


G COM L F 32 


Group compare less floating-point single 


G COM L F 32 X 


Group compare less floating-point single exact 


G COM L F 64 

VJ . WV-/IVI .L.I .V/*T 


Group compare less floating-point double 


G COM L F 64 X 

VJ . W\-/IVI .L.I . U*T./\ 


Group compare less floating-point double exact 


G COM L F 128 

\J . V-/ V/l VI .L.I. 1 ^Vs 


Group compare less floating-point quad 


G COM L F 128 X 


Group compare less floating-point quad exact 


G COM L G F 16 

\J7 . V^V«/I VI . LVJ . 1 . 1 KJ 


Group compare less or greater floating-point half 


G COM LG F 16 X 


Group compare less or greater floating-point half exact 


G COM LG F 32 

V?. VSL/IVI.Lv^* 1 »\J^ 


Group compare less or greater floating-point single 


G COM LG F 32 X 


Group compare less or greater floating-point single exact 


G.COM.LG.F.64 


Group compare less or greater floating-point double 


G.COM.LG.F.64.X 


Group compare less or greater floating-point double exact 


G.COM.LG.F.128 


Group compare less or greater floating-point quad 


G.COM.LG.F.128.X 


Group compare less or greater floating-point quad exact 



Fig. 40A 



Format 



G.COM.op.prec.round rd.rc 
rc=gcomopprecround(rd,rc) 

31 24 23 18 17 12 11 65 0 

I G.prec | rd | rc | op | GCOM \ 

8 6 6 6 6 



Fig. 40B 



Definition 



def GroupCompareFloatingPoint(op,prec,round,rd,rc) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
for i «- 0 to 128-prec by prec 
di^Ftprecdi+prec-l..!) 
ci^-FCpreccKprec-l.-i) 
if round*NONE then 

if (di.t = SNAN) or (ci.t = SNAN) then 
raise FloatingPointArithmetic 

endif 

case op of 

G.COM.LF, G.COM.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.COM.LF: 

ai <- di?£ci 
G.COM.GE.F: 

ai <- di!?<ci 
G.COM.E.F: 

ai <- di=ci 
G.COM.LG.F: 

ai <- di^ci 

endcase 

a i+prec-1..» «- a * 
endfor 

if (a * 0) then 

raise FloatingPointArithmetic 

endif 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 40C 



E.ABS.F.16 


Ensemble absolute value floating-point half 


E.ABS.F.16.X 


Ensemble absolute value floating-point half exception 


E.ABS.F.32 


Ensemble absolute value floating-point single 


E.ABS.F.32.X 


Ensemble absolute value floating-point single exception 


E.ABS.F.64 


Ensemble absolute value floating-point double 


E.ABS.F.64.X 


Ensemble absolute value floating-point double exception 


E.ABS.F.128 


Ensemble absolute value floating-point quad 


E.ABS.F.128.X 


Ensemble absolute value floating-point quad exception 


E.C0PY.F.16 


Ensemble copy floating-point half 


E.C0PY.F.16.X 


Ensemble copy floating-point half exception 


E.COPY.F.32 


Ensemble copy floating-point single 


E.COPY.F.32.X 


Ensemble copy floating-point single exception 


E.COPY.F.64 


Ensemble copy floating-point double 


E.COPY.F.64.X 


Ensemble copy floating-point double exception 


E.COPY.F.128 


Ensemble copy floating-point quad 


E.COPY.F. 128.X 


Ensemble copy floating-point quad exception 


E.DEFLATE.F.32 


Ensemble convert floating-point half from single 


E.DEFLATE.F.32.C 


Ensemble convert floating-point half from single ceiling 


E.DEFLATE.F.32.F 


Ensemble convert floating-point half from single floor 


E.DEFLATE.F.32.N 


Ensemble convert floating-point half from single nearest 


E.DEFLATE.F.32.X 


Ensemble convert floating-point half from single exact 


E.DEFLATE.F.32.Z 


Ensemble convert floating-point half from single zero 


E.DEFLATE.F 64 


Ensemble convert floating-point single from double 


E.DEFLATE.F 64 C 


Ensemble convert floating-point single from double ceiling 


E.DEFLATE.F.64.F 


Ensemble convert floating-point single from double floor 


E.DEFLATE.F.64.N 


Ensemble convert floating-point single from double nearest 


E.DEFLATE.F.64.X 


Ensemble convert floating-point single from double exact 


E.DEFLATE.F.64.Z 


Ensemble convert floating-point single from double zero 


E. DEFLATE. F.1 28 


Ensemble convert floating-point double from quad 


E.DEFLATE.F.128 C 


Ensemble convert floating-point double from quad ceiling 


E. DEFLATE. F.1 28.F 


Ensemble convert floating-point double from quad floor 


E.DEFLATE.F.128 N 


Ensemble convert floating-point double from quad nearest 


E.DEFLATE.F 128.X 


Ensemble convert floating-point double from quad exact 


E.DEFLATE.F. 128.Z 


Ensemble convert floating-point double from quad zero 


E.FL0AT.F.16 


Ensemble convert floating-point half from doublets 


E.FL0AT.F.16.C 


Ensemble convert floating-point half from doublets ceiling 


E.FL0AT.F.16.F 


Ensemble convert floating-point half from doublets floor 


E.FL0AT.F.16.N 


Ensemble convert floating-point half from doublets nearest 


E.FL0AT.F.16.X 


Ensemble convert floating-point half from doublets exact 


E.FL0AT.F.16.Z 


Ensemble convert floating-point half from doublets zero 



Fig. 41A 



E.FLOAT.F.32 


Ensemble convert floating-point single from quadlets 


E.FLOAT.F.32.C 


Ensemble convert floating-point single from quadlets ceiling 


E.FLOAT.F.32.F 


Ensemble convert floating-point single from quadlets floor 


E.FLOAT.F.32.N 


Ensemble convert floating-point single from quadlets nearest 


E.FLOAT.F.32.X 


Ensemble convert floating-point single from quadlets exact 


E.FLOAT.F.32.Z 


Ensemble convert floating-point single from quadlets zero 


E.FLOAT.F.64 


Ensemble convert floating-point double from octlets 


E.FLOAT.F.64.C 


Ensemble convert floating-point double from octlets ceiling 


E.FLOAT.F.64.F 


Ensemble convert floating-point double from octlets floor 


E.FLOAT.F.64.N 


Ensemble convert floating-point double from octlets nearest 


E.FLOAT.F.64.X 


Ensemble convert floating-point double from octlets exact 


E.FLOAT.F.64.Z 


Ensemble convert floating-point double from octlets zero 


E.FLOAT.F.128 


Ensemble convert floating-point quad from hexlet 


E.FLOAT.F.128.C 


Ensemble convert floating-point quad from hexlet ceiling 


E.FLOAT.F.128.F 


Ensemble convert floating-point quad from hexlet floor 


E.FLOAT.F.128.N 


Ensemble convert floating-point quad from hexlet nearest 


E.FLOAT.F.128.X 


Ensemble convert floating-point quad from hexlet exact 


E.FLOAT.F.128.Z 


Ensemble convert floating-point quad from hexlet zero 


E.INFLATE.F.16 


Ensemble convert floating-point single from half 


E.INFLATE.F.16.X 


Ensemble convert floating-point single from half exception 


E.INFLATE.F.32 


Ensemble convert floating-point double from single 


E.INFLATE.F.32.X 


Ensemble convert floating-point double from single exception 


E. INFLATE. F.64 


Ensemble convert floating-point quad from double 


E.INFLATE.F.64.X 


Ensemble convert floating-point quad from double exception 


E.NEG.F.16 


Ensemble negate floating-point half 


E.NEG.F.16.X 


Ensemble negate floating-point half exception 


E.NEG.F.32 


Ensemble negate floating-point single 


E.NEG.F.32.X 


Ensemble negate floating-point single exception 


E.NEG.F.64 


Ensemble negate floating-point double 


E.NEG.F.64.X 


Ensemble negate floating-point double exception 


E.NEG.F.128 


Ensemble negate floating-point quad 


E.NEG.F.128.X 


Ensemble negate floating-point quad exception 


E.RECEST.F.16 


Ensemble reciprocal estimate floating-point half 


E.RECEST.F.16.X 


Ensemble reciprocal estimate floating-point half exception 


E.RECEST.F.32 


Ensemble reciprocal estimate floating-point single 


E.RECEST.F.32.X 


Ensemble reciprocal estimate floating-point single exception 


E.RECEST.F.64 


Ensemble reciprocal estimate floating-point double 


E.RECEST.F.64.X 


Ensemble reciprocal estimate floating-point double exception 


E.RECEST.F.128 


Ensemble reciprocal estimate floating-point quad 


E.RECEST.F. 128.X 


Ensemble reciprocal estimate floating-point quad exception 
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E.RSQREST.F.16 


Ensemble floating-point reciprocal square root estimate half 


E.RSQREST.F.1 6.X 


Ensemble floating-point reciprocal square root estimate half exact 


E.RSQREST.F.32 


Ensemble floating-point reciprocal square root estimate single 


E.RSQREST.F.32.X 


Ensemble floating-point reciprocal square root estimate single exact 


E.RSQREST.F.64 


Ensemble floating-point reciprocal square root estimate double 


E.RSQREST.F.64.X 


Ensemble floating-point reciprocal square root estimate double exact 


E.RSQREST.F.1 28 


Ensemble floating-point reciprocal square root estimate quad 


E.RSQREST.F.1 28.X 


Ensemble floating-point reciprocal square root estimate quad exact 


E.SINK.F.16 


Ensemble convert floating-point doublets from half nearest default 


E.SINK.F.16.C 


Ensemble convert floating-point doublets from half ceiling 


E.SINK.F.16.C.D 


Ensemble convert floating-point doublets from half ceiling default 


E.SINK.F.16.F 


Ensemble convert floating-point doublets from half floor 


E.SINK.F.16.F.D 


Ensemble convert floating-point doublets from half floor default 


E.SINK.F.16.N 


Ensemble convert floating-point doublets from half nearest 


E.SINK.F.16.X 


Ensemble convert floating-point doublets from half exact 


E.SINK.F.16.Z 


Ensemble convert floating-point doublets from half zero 


E.SINK.F.16.Z.D 


Ensemble convert floating-point doublets from half zero default 


E.SINK.F.32 


Ensemble convert floating-point quadlets from single nearest default 


E.SINK.F.32.C 


Ensemble convert floating-point quadlets from single ceiling 


E.SINK.F.32.C.D 


Ensemble convert floating-point quadlets from single ceiling default 


E.SINK.F.32.F 


Ensemble convert floating-point quadlets from single floor 


E.SINK.F.32.F.D 


Ensemble convert floating-point quadlets from single floor default 


E.SINK.F.32.N 


Ensemble convert floating-point quadlets from single nearest 


E.SINK.F.32.X 


Ensemble convert floating-point quadlets from single exact 


E.SINK.F.32.Z 


Ensemble convert floating-point quadlets from single zero 


E.SINK.F.32.Z.D 


Ensemble convert floating-point quadlets from single zero default 


E.SINK.F.64 


Ensemble convert floating-point octlets from double nearest default 


E.SINK.F.64.C 


Ensemble convert floating-point octlets from double ceiling 


E.SINK.F.64.C.D 


Ensemble convert floating-point octlets from double ceiling default 


E.SINK.F.64.F 


Ensemble convert floating-point octlets from double floor 


E.SINK.F.64.F.D 


Ensemble convert floating-point octlets from double floor default 


E.SINK.F.64.N 


Ensemble convert floating-point octlets from double nearest 


E.SINK.F.64.X 


Ensemble convert floating-point octlets from double exact 


E.SINK.F.64.Z 


Ensemble convert floating-point octlets from double zero 


E.SINK.F.64.Z.D 


Ensemble convert floating-point octlets from double zero default 


E.SINK.F.128 


Ensemble convert floating-point hexlet from quad nearest default 


E.SINK.F.128.C 


Ensemble convert floating-point hexlet from quad ceiling 


E.SINK.F.1287C.D 


Ensemble convert floating-point hexlet from quad ceiling default 


E.SINK.F.128.F 


Ensemble convert floating-point hexlet from quad floor 


E.SINK.F.128.F.D 


Ensemble convert floating-point hexlet from quad floor default 
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F ^INK F 198 N 
C.OIlNrx.r. in 


Ensemble convert floating-point hexlet from quad nearest 


F ^IMK F 198 X 


Ensemble convert floating-point hexlet from quad exact 


F <^IMK F 198 7 

COIINrVr. \C.\J.&- 


Ensemble convert floating-point hexlet from quad zero 


F ^INK F 198 7 D 

C.OIINrX.r . I l^\J 


Ensemble convert floating-point hexlet from quad zero default 


F <nOR F 1fi 


Ensembl square root floating-point half 


F QOR F 16 P 

C.OWrx.r. lU.w 


Ensemble square root floating-point half ceiling 


F ^HR F 18 F 


Ensemble square root floating-point half floor 


F ^OR P IRN 


Ensemble square root floating-point half nearest 


F ^OR F 16 y 

L.OWrx.r. IU.A 


Ensemble square root floating-point half exact 


F QOR F 18 7 


Ensemble square root floating-point half zero 


F ^OR F 19 


Ensemble square root floating-point single 


F ^OR F 19 P 


Ensemble square root floating-point single ceiling 


F QOR F 19 F 


Ensemble square root floating-point single floor 


F 90R F 19 M 


Ensemble square root floating-point single nearest 


F <nOR F 19 Y 


Ensemble square root floating-point single exact 


F <50R F 19 7 


Ensemble square root floating-point single zero 


F 90R F 84 


Ensemble square root floating-point double 


F ^OR F 84 P 
C.OWrx.r .U*t. w 


Ensemble square root floating-point double ceiling 


F QOR F 64 F 


Ensemble square root floating-point double floor 


F QOR F 64 M 


Ensemble square root floating-point double nearest 


F QOR F 64 Y 


Ensemble square root floating-point double exact 


F ^OR F 64 7 


Ensemble square root floating-point double zero 


F QOR F 198 


Ensemble square root floating-point quad 


F QHR F 198 P 


Ensemble square root floating-point quad ceiling 


F ^OR F 198 F 


Ensemble square root floating-point quad floor 


F ^DR F 198 M 


Ensemble square root floating-point quad nearest 


F QOR F 198 y 


Ensemble square root floating-point quad exact 


F QOR F 198 7 


Ensemble square root floating-point quad zero 


F 91 IM F 16 

C . O U IVI . 1 . i u 


Ensemble sum floating-point half 


F9IIMF1fiP 
c.ouivi.r, io.u 


Ensemble sum floating-point half ceiling 


F IM F 16 F 
c.ouivi.r. lu.r 


Ensemble sum floating-point half floor 


F 91 IM F 16 N 
c..ouivi.r. lu.iN 


Ensemble sum floating-point half nearest 


F IM F 16 y 
c.ouivi.r. lu.A 


Ensemble sum floating-point half exact 


F cm IM F 16 7 
COUIVI.r. lUX 


Ensemble sum floating-point half zero 


c ci IM F 19 


Ensemble sum floating-point single 


c qi iM c oo p 

C.OUIVI.r .O^.V^/ 


Ensemble sum floating-point single ceiling 


E SUM F 32 F 


Ensemble sum floating-point single floor 


E.SUM.F.32.N " 


Ensemble sum floating-point single nearest 


E.SUM.F.32.X 


Ensemble sum floating-point single exact 


E.SUM.F.32.Z 


Ensemble sum floating-point single zero 
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r— rti ill CCA 

E.SUM.F.64 


Pncpmhlfi Qum floatinn-ooint doubls 


p— o 1 1 ft a r~ C A i 

E.SUM.F.04.0 


Fncpmhle sum floatinn-ooint double ceilino 


E.SUIvl.F.64.r 


Pncpmhlp sum float inn-ooint double floor 
ullociiiuio oum imam ly-puii ii uuuuio iiwi 


E.SUM.F.64.N 


Pncpmhlp Qiim float! nn-noint double nAafPct 


E.SUM.F.64.X 


Pncpmhlp Qiim flnatinn-nnint donhlp pxart 


f— /> i 1 ft « i— /> j -7 

E.SUM.F.64.Z 


Pncpmhlp cum flnatinn-noint douhlA 7Pro 
a loci i luio out ii iiudiii ly-pwii u uuuuid &ciu 


r— o 1 1 ft 4 P" A nn 

E. SUM. F. 128 


Pncpmhlp ci im float inn-nnint niiad 
diotzuiuio out ii iiuciui iy-^Aju ii tjuau 


i— oi i ft j r - a no a> 

E.SUM.F.128.C 


Pncomhlo cnm flnatinn.nnint niiad rpilinn 
ClioclMUiU ouin nualll iy~|AJH ii mJavj uciuiiy 


P Ql IM P 19ft P 
EZ.OUlvl.r. I^O.r 


Ensemble sum floating-point quad floor 


E.SUM.F.128.N 


Ensemble sum floating-point quad nearest j 


E.SUM.F.128.X 


Ensemble sum floating-point quad exact 


E.SUM.F.128.Z 


Ensemble sum floating-point quad zero 



Selection 





op 


prec 


round/trap 


copy 


COPY 


16 32 64 128 


NONE X 


absolute 
value 


ABS 


16 32 64 128 


NONE X 


float from 
integer 


FLOAT 


16 32 64 128 


noneCFNXZ 


integer 
from float 


SINK 


16 32 64 128 


NONE C F N X Z 
C.DF.DZ.D 


increase 

format 

precision 


INFLATE 


16 32 64 


NONE X 


decrease 

format 

precision 


DEFLATE 


32 64 128 


NONE C F N X Z 


negate 


NEG 


16 32 64 128 


NONE X 


reciprocal 
estimate 


RECEST 


16 32 64 128 


NONE X 


reciprocal 
square root 
estimate 


RSQREST 


16 32 64 128 


NONE X 


square root 


SQR 


16 32 64 128 


NONE C F N X Z 


sum 


SUM 


16 32 64 128 


NONE C F N X Z 
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Format 

E.op.prec.round rd=rc 
rd=eopprecround(rc) 

31 24 23 18 17 12 11 6 5 0 

I E.prec | rd | rc | op | E.UNARY I 

8 6 6 6 6 



Fig. 41 B 



Definition 

def EnsembleUnaryFloatingPoint(op,prec,round,rd,rc) as 
c <- RegRead(rc, 128) 
case op of 

E.ABS.F, E.NEG.F, E.SQR.F: 
for i <r- 0 to 128-pr c by prec 

ci<~F(prec ( Ci +P rec-1.j) 
case op of 

E.ABS.F: 

ai.t «- ci.t 

ai.s <- 0 

ai.e <- ci.e 

ai.f <- ci.f 
E.COPY.F: 

ai <-ci 
E.NEG.F: 

ai.t <- ci.t 

ai.s -ci.s 

ai.e «- ci.e 

ai.f <- ci.f 
E.RECEST.F: 

ai <- frecest(ci) 
E.RSQREST.F: 

ai <- frsqrest(ci) 
E.SQR.F: 

ai <- fsqr(ci) 

endcase 

ai+prec-1..i <- PackF(prec, ai, round) 
endfor 
E.SUM.F: 

p[0].t <r- NULL 

for i <r- 0 to 128-prec by prec 

p[i+prec] <- fadd(p[i], F(prec,Cj+ pr ec-1..i)) 
endfor 

a <- PackF(prec, p[128], round) 
E.SINK.F: 

for i <~ 0 to 128-prec by prec 
ci<-F(prec,Ci +P rec-1..i) 
ai+prec-1..i <- fsinkr(prec, ci, round) 
endfor 
E.FLOAT.F: 

for i <r- 0 to 128-prec by prec 

ci.t <- NORM 
' "ri.e <- 0 

ci.s Cj+prec-t 

ci.f <r- ci.s ? 1 +~Cj +pre c-2..i : Ci+prec-2..i 
ai+prec-L.i «- PackF(prec, ci, round) 
endfor 

Fig. 41 C 



E.INFLATE.F: 

for i 0 to 64-prec by prec 
ci^F(prec,Cj +pre c-l..i) 

ai+i+prec+prec-1..i+i «- PackF(prec+prec, ci, round) 
endfor 
E.DEFLATE.F: 

for i ^- 0 to 128-prec by prec 

ci<-F(prec t Ci +P rec-1..i) 

ai/2+prec/2-1..i/2 «- PackF(prec/2, ci, round) 
endfor 
ai27..64<-0 

endcase 

RegWritefrd, 128, a] 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 41C (cont'd) 



E.MULG.8 


Ensemble multiply Galois field byte 


E.MULG.64 


Ensemble multiply Galois field octlet 



Fig. 42A 



Format 

E.MUL.G.size ra=rd,rc,rb 
ra=emulgsize(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

f E.MUL.G.size | rd | rc | rb | ra | 

8 6 6 6 6 



Fig.42B 



Definition 

def c <- PolyMultiply(size,a,b) as 

p[0] <- o 2#size 

for k <- 0 to size-1 

p[k+1] <- p[k] A a k ? (0 sjz ^ k || b || 0 k ) : 0 2 * size 

endfor 

c<- p[size] 
enddef 

def c <- PolyResidue(size,a,b) as 
p[0] <- a 

for k <r- size-1 to 0 by -1 

PlK+1] +- PM a PtOWk ? (0 size " k I1 1 1 II b || 0 k ) : C)2*size 
endfor 

c<-p[size] S jze-1..0 
enddef 

def EnsembleTemaryfop.size.rd.rc.rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 

E.MULG: 

for i <- 0 to 128-size by size 

asize-1+i.J <- Poly R esidue(size,PolyMul(size f c S i2e-1+LJ.bsize-1+ 
endfor 

endcase 

RegWrite(ra, 128, a) 
enddef 



Exceptions 

none 



Fig. 42C 
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127 



rc(128) 



rb(8) 



128 



ra(128) o 
Ensemble multiply Galois field bytes 
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X C0MPRESS.2 


Crossbar compress signed pecks 


X C0MPRESS.4 


Crossbar compress signed nibbles 


X C0MPRESS.8 

W X • X*^ X*^ If II 1 X b« X*^ • X^ 


Crossbar compress signed bytes 


X C0MPRESS.16 


Crossbar compress signed doublets 


X COMPRESS.32 

XX* X*^ If 1 1 1 X X*^ ■ X^^» 


Crossbar compress signed quadlets 


X COMPRESS 64 

✓ \ • \^ \^ 1 V 1 1 I x^_x^x^>v • 


Crossbar compress signed octlets 


X COMPRESS 128 


Crossbar compress signed hexlet 


X COMPRESS U 2 

XX»X^Xj^I¥fl ■ X ^™ Xi^ X^ • Xi^ • fc» 


Crossbar compress unsigned pecks 


X COMPRESS U.4 


Crossbar compress unsigned nibbles 


X COMPRESS U 8 

/»i Willi 1 X ^» X,^ X»^ » X^ • X^ 


Crossbar compress unsigned bytes 


X.C0MPRESS.U.16 

X X » If II • X %^ %^ * • 1 X^ 


Crossbar compress unsigned doublets 


X COMPRESS.U.32 


Crossbar compress unsigned quadlets 


X COMPRESS U 64 

/ \t V/W If II 1 X^»X^ X^ » » X^ 1 


Crossbar compress unsigned octlets 


X COMPRESS U 128 


Crossbar compress unsigned hexlet 


X EXPAND 2 


Crossbar expand signed pecks 


X EXPAND 4 


Crossbar expand signed nibbles 


X EXPAND 8 


Crossbar expand signed bytes 


X EXPAND 16 

X X» \l t XI f X^ • 1 V-/ 


Crossbar expand signed doublets 


X EXPAND 32 


Crossbar expand signed quadlets 


X EXPAND 64 


Crossbar expand signed octlets 


X EXPAND 128 

r X • XI # 1l 1 • 1 vx 


Crossbar expand signed hexlet 


X EXPAND U 2 


Crossbar expand unsigned pecks 


X EXPAND U 4 

X X ■ # X 1 f XI iWiWl F 


Crossbar expand unsigned nibbles 


X.EXPAND.U.8 


Crossbar expand unsigned bytes 


X.EXPAND.U.16 


Crossbar expand unsigned doublets 


X.EXPAND.U.32 


Crossbar expand unsigned quadlets 


X.EXPAND.U.64 


Crossbar expand unsigned octlets 


X.EXPAND.U.128 


Crossbar expand unsigned hexlet 


X.R0TL2 


Crossbar rotate left pecks 


X.R0TL.4 


Crossbar rotate left nibbles 


X.R0TL8 


Crossbar rotate left bytes 


X.R0TL16 


Crossbar rotate left doublets 


X.ROTL.32 


Crossbar rotate left quadlets 


X.ROTL.64 


Crossbar rotate left octlets 


X.ROTL128 


Crossbar rotate left hexlet 


X.R0TR.2 


Crossbar rotate right pecks 


X.R0TR.4 — 


Crossbar rotate right nibbles 


X.R0TR.8 


Crossbar rotate right bytes 


X.R0TR.16 


Crossbar rotate right doublets 
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X ROTR 32 


Crossbar rotate riaht auadlets 


X ROTR 64 


Crossbar rotate riaht octlets 


X ROTR 128 


Crossbar rotate riaht hexlet 

^^l www vUl i >^W*fcW 1 '^4* »* * iw^«w» 


X SHI 2 


Crossbar shift left Decks 

>✓! WWWWWl Wl III 1 IwlV WWWI»W 


X SHL 2 O 


Crossbar shift left sinned Decks check overflow 

V/l Vwwl/Ql wl III I ICI 1 Oly 1 IvVI p\*wl\w VI 1 v vi\ W V wl ■ I W» 


X SHL 4 


Crossbar shift left nibbles 

WW W MVII Wl 1 1 1 * I 1 % III WW! WW 


X SHL 4 O 


Hrnsshar shift left sinned nibbles check overflow 


X SHL 8 

A.OnL.O 


Crossbar shift left bvtes 

V*' 1 Vww WU 1 wl III I Ivll WTlW 


X SHL 8 O 

A.OllL.O.VJ 


Crosshar shift left sinned bvtes check overflow 

vIODwUCII Olllll Ivl I Ol^l Iwvi UyiCO wl ICvIX UVvlllvn 


X SHL 16 

A.wl 1 L. > 1 w 


Crossbar shift left doublets 


X SHL 16 O 


Crosshar shift left sinned doublets check overflow \ 

VlwwwL/QI wl III i Iwll OIUI Iww VlVUk/lww Wl IwwrV w V wl 1 IWif 


X SHL 32 


Crossbar shift left auadlets 

Wvwk/UI Wl III 1 IWI % UVIVIVIIwkW 


X SHL 32 O 


Crosshar shift left sinned nuadlets check overflow 

V-/I wOOwCll Olllll Ivl I Ol^l IwU UjUCIwlwlO wl lOwlX W V wl 1 IWW 


X SHL 64 

AiUl ii—. w~ 


Crossbar shift left octlets 


X SHL 64 O 


Crosshar shift left sinned octlets check overflow 

wl UOOUCII Olllll Iwll Olwl ICU vvUvlw wl IwwrV WVwIIIWVV 


X SHL 128 


Crossbar shift left hexlet 

\m* 1 VwwUvll Wl HIV IWI V 1 IVAIVt 


X SHL 128 O 


Crossbar shift left sinned hexlet check overflow 

Vl UwwwCII Olllll Iwll wlwl Iww 1 IwAlv 1 Wl IwWrV vivl IIWTf 


X SHL U 2 O 


Crosshar shift left unsioneri necks check overflow 

wlUOdUal Olllll Iwll Ul Iwlwl IwSJ wwWrVw wl 1 wwlV W V wl llvll 


X SHL LJ 4 O 


f^rnsshar shift left unsinned nihhles check overflow 

vslwwOwGI Olllll Iwll LJ 1 lOlw 1 ICU 1 llwwlww wl IwwrV WvwIllwVV 


X SHL U 8 O 


Crosshar shift left unsinned bvtes check overflow 

wl UOOUul Olllll Iwll VJI Iwiyi Iww wj Vww wl IwwrV wyvMIWti 


X SHL U 16 O 


HrnQQhar shift left unsinned dnuhlets check overflow 

wl UOdUCII Olllll Iwll Ul IOIVJI Iww UOUUIvlO wl IwwrV WW llwif 


X SHL U 32 O 


f^roQQhar Qhift left unsinned nuadlets check overflow 

V/l vdOUdl Olllll Iwll UIIOIwJIww ^UuUivld wl IwwrV WvwIllwVV 


X SHL U 64 O 

A.VJI 11-. W . w*T. V-/ 


Crossbar shift left unsinned octlets check overflow 

vl vOOUCI Olllll Iwll Ul IOIUI IwU Wwllwlw wl IwwrV WVWIIIWVV 


X SHI U 128 O 


rtrnQQhar shift left unsinned hexlet check overflow 

vl WOOl/QI Olllll ICI I Ul 'Oiy 1 Iww 1 IwAlvl wl IwwrV WV wl IIWVV 


X SHR 2 


Crossbar sianed shift riaht Decks 

v^l wwwwdl wIVJI Iww wl HIV. 1 1*^ 


X SHR 4 

A.onrx.t 


Crosshar sianed shift riaht nibbles 

WWW WW 1 vlM 1 IWW Willie 1 'jj* * » 1 1 1 W W IWW 


X SHR 8 


Crossbar sianed shift riaht bvtes 

\*S 1 VWV W wl 1 WlW 1 IWW Wl Mil I Im 1 1 % W T IV w 


X SHR 16 

A.onrx. 1 w 


Crossbar sianed shift riaht doublets 

^mf* WWWWWl WlWI IWW Wl 111% ■ iVfl 1* WVWMIWltf 


X SHR 32 


Crossbar sianed shift riaht auadlets 


X SHR 64 


Crossbar sianed shift riaht octlets 

V( VVW Vvl 1 WlMI IWW Wl II 1 % 1 1 Wf * 1 » W WH W %W 


X SHR 128 

A.onr\. i 


Crossbar sianed shift riaht hexlet 

N«/ 1 WwwwGII WlUI IwU wl HIV 1 IM 1 11 1 IvAIw V 


X SHR U 2 

A.OI 1 1 \ . \J • Cm 


Crossbar shift riaht unsianed Decks 

V^l X^WWWWCI Wl III % 1 *23 1 W ■ >J 1 IWW WWW! »w 


X SHR I J 4 


Crossbar shift riaht unsianed nibbles 

\m/ 1 Wwwwdl Wl III i 1 IM 1 11 VI 1 IwImI Iww 1 IIWWIWW 


X.SHR.U.8 


Crossbar shift right unsigned bytes j 


X.SHR.U.16 


Crossbar shift right unsigned doublets 


X.SHR.U.32 


Crossbar shift right unsigned quadlets 


X.SHR.U.64 


Crossbar shift right unsigned octlets 


X.SHR.U.128 


Crossbar shift right unsigned hexlet 



Fig. 43A (cont'd) 



Selection 



class 


op 


size 


precision 


EXPAND EXPAND.U 
COMPRESS 

COMPRESS. 

U 


2 4 8 16 32 64 128 


shift 


ROTR ROTL SHR SHL 
SHL.O SHL.U.O 
SHR.U 


2 4 8 16 32 64 128 



Format 

X.op.size rd=rc,rb 
rd=xopsize(rc,rb) 

31 252423 18 17 12 11 6 5 21 0 

I XSHIFT |s| rd I rc I rb | op | sz | 

7 1 6 6 6 4 2 

Isize <- log(size) 
s «- Isize2 
sz<- Isizei.o 

Fig. 43B 



Definiti n 

def Crossbar(op,size,rd,rc,rb) 
c «- RegRead(rc f 128) 
b <- RegRead(rb, 128) 
shift <- b and (siz -1) 
case ops.,2 || 0 2 of 
X.COMPRESS: 
hsize <- size/2 
for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

a|+hsize-1..i <- Ci+i+shitt+hsize-1 J+i+shift 

else 

ai+hsize-1..i <- <f+^"fee?f II Ci+i+size-1..i+i+shitt 

end if 
endfor 
ai27..64<-0 
X.COMPRESS. U: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift ^ hsize then 

aj+hsize-U «- c i+i+shift+hsize-1..i+i+shift 

else 

aj+hsize-1..i «- 0 shift - hslze || q+j+ S ize-1..i+i+shift 

end if 
endfor 
ai27..64<-0 
X.EXPAND: 

hsize «- size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

an+size-1 J+i <- cUftBJf || Cj+hsize-1 ..i II 0 shift 

else 

aw+size-1..i+i <- c i+size-shift-1 ..i II ° shifl 

end if 
endfor 
X.EXPAND.U: 

hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift £ hsize then 

aw+size-1..W «- Ohsize-shift || c Khsize .i j II 0*« 

else 

• — . aj+i+sjze-1 ..j+j <- Ci+size-shift-1 ..ill ° shift 

end if 
endfor 
X.ROTL: 

for i <- 0 to 128-size by size 

aj+size-1..i <- Cj+ S ize-1 -shift.. i II Cj+size-1..i+size-1 -shift 
endfor 



Fig. 43C 



X.ROTR: 

fori 4-0 to 128-siz bysiz 

aj+size-1 ..i <- Cj +S hjfl-1 ..ill Cj+ S ize-1 ..i+shift 
endfor 
X.SHL: 

for i <- 0 to 128-size by size 

aj+size-1. J «- q+size-1 -shift..! II 0 shift 
endfor 
X.SHL.O: 

for i <- 0 to 128-size by size 

if Cj+size-1 ..i+size-1-shift * ^sizell-shift then 
raise FixedPointArithmetic 

endif 

aj+size-1. J «- C}+ S j Z e-i-shifUll 0 shift 
endfor 
X.SHLU.O: 

for i +- 0 to 128-size by size 

if Cj+size-U+size-shift * 0 shift then 
raise FixedPointArithmetic 

endif 

aj+size-1. .i «- Cj+size-1-shifull 0 shift 
endfor 
X.SHR: 

for i +- 0 to 128-size by size 

aj+size-1. .i «- cf+ h <!|e-1 II c i+size-1..i+shifl 
endfor 
X.SHR.U: 

for i <- 0 to 128-size by size 

aj+size-1 .J «- 0 shlft II c i+size .i j+shift 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 43C (cont'd) 



i 1 taltii 1 lit 


mi 1 t 11 1 II i 






mm 





Compress 32 bits to 16, with 4-bit right shift 
Fig. 43D 



Operati nc des 



X.SHL.M.2 


Crossbar shift left merge pecks 


X.SHL.M.4 


Crossbar shift left merge nibbles 


X.SHLM.8 


Crossbar shift left merge bytes 


X.SHL.M.16 


Crossbar shift left merge doubl ts 


X.SHL.M.32 


Crossbar shift left merge quadlets 


X.SHL.M.64 


Crossbar shift left merge octlets 


X.SHL.M.128 


Crossbar shift left merge hexlet 


X.SHR.M.2 


Crossbar shift right merge pecks 


X.SHR.M.4 


Crossbar shift right merge nibbles 


X.SHR.M.8 


Crossbar shift right merge bytes 


X.SHR.M.16 


Crossbar shift right merge doublets 


X.SHR.M.32 


Crossbar shift right merge quadlets 


X.SHR.M.64 


Crossbar shift right merge octlets 


X.SHR.M.128 


Crossbar shift right merge hexlet 



Flg.43E 



Format 



X.op.size rd@rc,rb 
rd=xopsize(rd,rc,rb) 

31 252423 18 17 12 11 6 5 21 

I XSHIFT |s| rd | rc | rb I op 

7 1 6 6 6 4 

Isize <- log(size) 
s Isize2 
sz<- lsizei..o 



Definition 

def Crossbarlnplace(op,size,rd,rc,rb) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
shift <-b and (size-1) 
for i «- 0 to 128-size by size 
case op of 
X.SHR.M: 

ai+size-1..i «- Ci+shift.1..i II dj+ S ize-1..i+shift 
X.SHLM: 

ai+size-1..i «- dj+size-1 -shift..! II Cj+ S hift-1..i 

endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 



Fig 43G 



Operation codes 



X.COMPRESS.1.2 


Crossbar compress immediate signed pecks 


X.COMPRESS.1.4 


Crossbar compress immediate signed nibbles 


X.C0MPRESS.I.8 


Crossbar compress immediate signed bytes 


X.C0MPRESS.I.16 


Crossbar compress immediate signed doublets 


X.COMPRESS.I.32 


Crossbar compress immediate signed quadlets 


X.COMPRESS.I.64 


Crossbar compress immediate signed octlets 


X.COMPRESS.1.128 


Crossbar compress immediate signed hexlet 


X.COMPRESS.I.U.2 


Crossbar compress immediate unsigned pecks 


X.COMPRESS.I.U.4 


Crossbar compress immediate unsigned nibbles 


X.C0MPRESS.I.U.8 


Crossbar compress immediate unsigned bytes 


X.C0MPRESS.I.U.16 


Crossbar compress immediate unsigned doublets 


X.COMPRESS.I.U.32 


Crossbar compress immediate unsigned quadlets 


X.COMPRESS.I.U.64 


Crossbar compress immediate unsigned octlets 


X.COMPRESS.I.U.128 


Crossbar compress immediate unsigned hexlet 


X.EXPAND.I.2 


Crossbar expand immediate signed pecks 


X.EXPAND.I.4 


Crossbar expand immediate signed nibbles 


X.EXPAND.I.8 


Crossbar expand immediate signed bytes 


X.EXPAND.1.16 


Crossbar expand immediate signed doublets 


X.EXPAND.I.32 


Crossbar expand immediate signed quadlets 


X.EXPAND.I.64 


Crossbar expand immediate signed octlets 


X.EXPAND.1.128 


Crossbar expand immediate signed hexlet 


X.EXPAND.I.U.2 


Crossbar expand immediate unsigned pecks 


X.EXPAND.I.U.4 


Crossbar expand immediate unsigned nibbles 


X.EXPAND.I.U.8 


Crossbar expand immediate unsigned bytes 


X.EXPAND.I.U.16 


Crossbar expand immediate unsigned doublets 


X.EXPAND.I.U.32 


Crossbar expand immediate unsigned quadlets 


X.EXPAND.I.U.64 


Crossbar expand immediate unsigned octlets 


X.EXPAND.I.U.128 


Crossbar expand immediate unsigned hexlet 


X.ROTL.I.2 


Crossbar rotate left immediate pecks 


X.ROTL.I.4 


Crossbar rotate left immediate nibbles 


X.R0TL.I.8 


Crossbar rotate left immediate bytes 


X.ROTL.1.16 


Crossbar rotate left immediate doublets 


X.ROTL.I.32 


Crossbar rotate left immediate quadlets 


X.ROTL.I.64 


Crossbar rotate left immediate octlets 


X.ROTL.1.128 


Crossbar rotate left immediate hexlet 


X.ROTR.I.2 


Crossbar rotate right immediate pecks 


X.ROTR.M — - 


Crossbar rotate right immediate nibbles 


X.ROTR.I.8 


Crossbar rotate right immediate bytes 


X.ROTR.1.16 


Crossbar rotate right immediate doublets 


X.ROTR.1.32 


Crossbar rotate right immediate quadlets 


X.ROTR.1.64 


Crossbar rotate right immediate octlets 


X.ROTR.1.128 


Crossbar rotate right immediate hexlet 



Fig. 43H 



V/ A III 1 s*\ 

X.SHLI.2 


Crossbar shift left immediate pecks 


V/ 1 II 1 o 

X.SHL.I.2.0 


orossoar snin len immeaiaie signeo pecKs check ovemow 


W O 1 II | J 

X.SHL.1.4 


urossoar snin ien immediate mooies 


w o I 1 1 I a /-\ 

X.SHLI.4.0 


orossDar snin ien immeaiaie signeo mooies cnecK ovemow 


v/ o iii in 

X.SHL.1.8 


urossoar snin ien immediate oytes 


X.SHL.1.8. 0 


urossDar snin ien immediate signed oytes check overflow 


X.SHLI.16 


orossoar snin ien immediate dou Diets 


V/ 1 II 1 4 /> 

X.SHLI.16.0 


Crossbar shift left immediate signed doublets check overflow 


X.SHL.1.32 


orossoar snin ien immediate quadlets 


X.SHLI.32.0 


Crossbar shift left immediate signed quadlets check overflow 


X.SHLI.64 


urossoar snin ien immediate octiets 


X.SHL.I.64.0 


Crossbar shift left immediate signed octiets check overflow 


X.SHLI.128 


urossoar snin ien immediate nexiet 


X.SHLI.128.0 


Crossbar shift left immediate signed hexlet check overflow 


X.SHL.I.U.2.0 


Crossbar shift left immediate unsigned pecks check overflow 


X.SHLI.U.4.0 


Crossbar shift left immediate unsigned nibbles check overflow 


v/ ("Mil i i i o /""\ 

X.SHL.I.U.8.0 


Crossbar shift left immediate unsigned bytes check overflow 


V/ Ol II 1 1 1 A f> /"N 

X.SHLI.U.16.0 


Crossbar shift left immediate unsigned doublets check overflow 


V/ 0 1 II III oo 

X.SHL.I.U.32.0 


Crossbar shift left immediate unsigned quadlets check overflow 


V/ /^l II III A /™\ 

X.SHLI.U.64.0 


Crossbar shift left immediate unsigned octiets check overflow 


v/ oi II III 4 

X.SHL.I.U. 128.0 


Crossbar shift left immediate unsigned hexlet check overflow 


v/ o i i n i ^> 

X.SHR.1.2 


Crossbar signed shift right immediate pecks 


v ai m i a 

X.SHR.1.4 


Crossbar signed shift right immediate nibbles 


V/ O 1 1 f\ 1 rt 

X.SHR.1.8 


Crossbar signed shift right immediate bytes 


w oil 1™* 1 ^ /*> 

X.SHR.1.16 


Crossbar signed shift right immediate doublets 


X.SHR.1.32 


Crossbar signed shift right immediate quadlets 


V/ ai m | f> A 

X.SHR.1.64 


Crossbar signed shift right immediate octiets 


X.SHR.1.128 


Crossbar signed shift right immediate hexlet 


w o i in i i i o 

X.SHR.I.U.2 


Crossbar shift right immediate unsigned pecks 


v/ oil r™\ i i i a 

X.SHR.I.U.4 


Crossbar shift right immediate unsigned nibbles 


V CUP IMA 

A.onK.I.U.o 


r^rnQQKar chift rinht immpHisfp imcinnoH Hv/ta^ 
v^iuoouai 91 hi i iiyin ii i ii i icutdic uiioiyiicu uyico 


X.SHR.I.U.16 


Crossbar shift right immediate unsigned doublets 


X.SHR.I.U.32 


Crossbar shift right immediate unsigned quadlets 


X.SHR.I.U.64 


Crossbar shift right immediate unsigned octiets 


X.SHR.I.U.128 


Crossbar shift right immediate unsigned hexlet 



Fig. 43H (cont) 



Select! n 



class 


op 


size 


precision 


COMPRESS.I 

PHMPRPQ^ 1 1 1 FYPANn 1 
KsKJfVlr rxCOO.I.U CArnlNU.I 

EXPAND.I.U 


2 4 8 16 32 64 128 


shift 


ROTL.I ROTR.I 
SHLI SHL.I.O 
SHL.I.U.O 
SHR.I SHR.I.U 


2 4 8 16 32 64 128 


copy 


COPY 





Format 



X.op.size rd=rc,shift 
rd=xopsize(rc,shift) 

31_ 24 23 18 17 12 11 65 0 

I XSHIFTI | rd | rc I simm | op | 

8 6 6 6 6 



1 4- 256-2*size+shift 

OP1..0 <~t7..6 

simm <- t5..o 



Fig. 43! 



Definiti n 



def CrossbarShortlmmediate(op,rd,rc,simm) 
cas (opi..o ||simm)of 



0..127: 




size 


<- 128 


A OO A f\A . 

128.. 191: 




size 


4- 64 


A f\*\ AAA . 

192. .223: 




size 


4-32 


224..239: 




size 


4- 16 


240..247: 




size 


<-8 


248-251: 




size 


<-4 


252..253: 




size 


<-2 


254..25S: 





raise Reserved Instruction 

endcase 

shift <- (opo || simm) and (size-1) 
c 4- RegRead(rc, 128) 
case (0P5..2 II 0 2 ) of 
X.COMPRESSJ: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift <, hsize then 

ai+hsize-1..i <- Cj+j+ S hift+hsize-1..i+i+shitt 

else 

ai+hsize-1..i «- <^]+s&IkP H Ci+i+size-1..i+i+shift 

endif 
endfor 
ai27..64<-0 
X.COMPRESS.I.U: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift <, hsize then 

ai+hsize-1..i «- Ci+|+shift+hsize-1..i+i+shift 

else 

ai+hsize-1 ..i <- 0 8hift - hsbe || q+i+size-1 ..i+i+shift 

endif 
endfor 
ai27^64<-0 



Fig. 43J 



X.EXP AND. I: 

hsize «- size/2 
for i <r- 0 to 64-hsize by hsize 
if shift shsiz then 

ai +i+ size-1..W «- cfei h f II c l+hS j ze -i..j II 0*« 

else 

ai+i+size-L-i+i *r Cj +S i Z e-shift.1..i II ° shlft 

endif 
endfor 
X.EXP AND. I.U: 
hsize <- size/2 
for i 0 to 64-hsize by hsize 
if shift £ hsize then 

aw +S ize-1..W <- O^size-shift || c i+hsize . 1 .j || 0*™ 

else 

ai+j+size-1..i+i «- C|+size-shift-1..i || 0 shlft 

endif 
endfor 
X.SHLI: 

for i «- 0 to 128-size by size 

aj+size-1..i «- Cj+size-1-shlftJll 0 shifl 
endfor 
X.SHLI.O: 

for i <- 0 to 128-size by size 

if Cj+size-1 J+size-1-shift * <f4*eh1-shift men 
raise FixedPointArithmetic 

endif 

ai +S i Z e-i j <- q +S ize-l-shift..ill 0 shifl 
endfor 
X.SHL.I.U.O: 

for i <- 0 to 1 28-size by size 

if Cj+size-1 ..i+size-shift * 0 shift then 
raise FixedPointArithmetic 

endif 

ai+size-1..i «- Cj+size-1 -shift.ill 0 shm 
endfor 

Fig. 43J (cont) 



X.ROTR.I: 

for i <- 0 to 1 28-size by siz 

ai+size-1..i «- Cj +s hift-1.j II Cj+size-1..i+shift 
endfor 
X.SHR.I: 

for i <- 0 to 1 28-size by siz 

ai+size-1..i «- II c i+stze-1.J+shlft 

endfor 
X.SHR.I.U: 

for i <- 0 to 1 28-size by size 

aj+size-1..i <- 0 shjft || c i+sl2e . 1 J+Shm 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 
Reserved Instruction 

Fig. 43J (cont) 



Operation codes 



X.SHL.M.1.2 


Crossbar shift left merge immediate pecks 


X.SHL.M.1.4 


Crossbar shift left merge immediate nibbles 


X.SHL.M.1.8 


Crossbar shift left merge immediate bytes 


X.SHLM.1.16 


Crossbar shift left merge immediate doublets 


X.SHL.M.I.32 


Crossbar shift left merge immediate quadlets 


X.SHLM.I.64 


Crossbar shift left merge immediate octlets 


X.SHLM.1.128 


Crossbar shift left merge immediate hexlet 


X.SHR.M.I.2 


Crossbar shift right merge immediate pecks 


X.SHR.M.I.4 


Crossbar shift right merge immediate nibbles 


X.SHR.M.I.8 


Crossbar shift right merge immediate bytes 


X.SHR.M.1.16 


Crossbar shift right merge immediate doublets 


X.SHR.M.I.32 


Crossbar shift right merge immediate quadlets 


X.SHR.M.I.64 


Crossbar shift right merge immediate octlets 


X.SHR.M.1.128 


Crossbar shift right merge immediate hexlet 



Fig 43K 



Format 



X.op.size rd@rc,shift 
rd=xopsize(rc,shift) 

31 24 23 18 17 12 11 6 5 0 

I XSHIFTI I rd I rc | simm I op I 

8 6 6 6 6 

t <- 256-2*size+shift 
opi..o*-t 7 „ 6 
simm <- t 5 ..o 



Fig 43L 



Definition 

def CrossbarShortlmmediatelnplacefap.rd/c.simm) 
case (opi..o ||simm) of 



0..127: 




size 


<- 128 


128..191: 




size 


*- 64 


192..223: 




size 


<-32 


224..239: 




size 


<- 16 


240..247: 




size 


<-8 


248..251: 




size 


<-4 


252.-253: 




size 


<- 2 


254..255: 





raise Reserved Instruction 

endcase 

shift <- (opo || simm) and (size-1 ) 
c <- RegRead(rc, 128) 
d <- RegRead(rd, 128) 
for i <- 0 to 128-size by size 
case (OP5..2 || 0 2 )of 
X.SHR.M.I: 

ai+size-1..i «- Cj +S hift-1..i II di+size-1..i+shift 
X.SHLM.I: 

a i+size-1..i <- di+size-1-shift..i II c i+shift-1..i 

endcase 
endfor 

RegWrite(rd f 128, a) 
enddef 

Exceptions 

Reserved Instruction 

Fig43M 



Format 



X. EXTRACT ra=rd,rc,rb 
ra=xextract(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 

I op I rd | rc | rb | ra 

8 6 6 6 6 



Fig. 44A 



Definition 



def CrossbarExtract(op,ra,rb,rc t rd) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case b8..o of 



0..255: 




gsize 4- 


128 


25B..383: 




gsize <- 


64 


384.447: 




gsize <- 


32 


448..479: 




gsize <- 


16 


480..495: 




gsize 4- 


8 


496..503: 




gsize 4- 


4 


504..507: 




gsize 4- 


2 


508..511: 




gsize 4- 


1 



end case 
m <- b-|2 

as4-signed<-bi4 
h <- (2-m)*gsize 

spos <- (b8..o) and ((2-m)*gsize-1) 
dpos 4- (0 || b23..i6) and (9Size-1) 
sfsize 4- (0 || b3i„24) and (gsize-1) 

tfeize <- (sfsize = 0) or ((sfsize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize 4- (tfsize + spos > h) ? h - spos : tfsize 
for i 4- 0 to 128-gsize by gsize 
case op of 

X. EXTRACT: 
if m then 

P<-<*gsize+M..i 

else 

P4-(d|| c)2*(g S ize+iM..2*i 

endif 

endcase 

v4-(as&p h -i)||p 

w 4- (as & Vspo S+ feize.l) 9Size - feizeKlpos II vfsize-1+spos..spos II 
if m then 

a size-1+U «- Cgsize-l+Ldpos+fsize+i II w dpos+fsize-1..dpos II Cdpos-I+L.i 

eise 

a size-1+U<~ w 

endif 

endfor 

RegWrite(ra, 128, a) 
enddef 



Exceptions 

none 



Fig. 44B 



< — fstee — >« dpos 
Crossbar extract 

Fig. 44C 



< — feizo — x opoo 




< — fsiz e — >< dpos 
Crossbar merge extract 



Fig. 44D 



Operation codes 



E.MUL.X 


Ensemble multiply extract 


E.EXTRACT 


Ensemble extract 


E.SCAL.ADD.X 


Ensemble scale add extract 



Fig. 44E 



Format 

E.op ra=rd,rc,rb 
ra=eop(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I op I rd | rc | rb | ra | 

8 6 6 6 6 



Fig. 44F 



def mul(size t h,vs,v,i.ws f w,j) as 

mul <- ((vs&v s ize-1+i) h " size II v S ize-1H.i) * ((ws&w siz e-l + j) h - slze II w S j 2e -i + j..j) 
enddef 

def EnsembleExtracUop.ra^rc.rd) as 
d <- RegRead(rd, 128) 
c<- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case b8..o of 
0..255: 

sgsize <- 128 
2S6..383: 

sgsize <- 64 
384..447: 

sgsize <- 32 
448..479: 

sgsize*- 16 
480..495: 

sgsize <- 8 
496..503: 

sgsize <- 4 
504..507: 

sgsize <- 2 
508..511: 

sgsize <- 1 

endcase 
i^-bn 

m <— b-|2 
n<-bi3 
signed <- b-|4 
case op of 

E. EXTRACT: 

gsize <- sgsize 

h <- (2-m)*gsize 

as <- signed 

spos <- (b8..o) and ((2-m)*gsize-1) 
E.SCALADD.X: 

if (sgsize < 8) then 

gsize*- 8 
elseif (sgsize*(n+1) > 32) then 
gsize <-32/(n+1) 

else 

gsize <- sgsize 

endif 

ds <=cs <- signed 

bs <- signed A m 

as <- signed or m or n 

h <- (2*gsize) + 1 + n 

spos <- (b8..o) and (2*gsize-1) 

Fig. 44G 



E.MUL.X: 

if (sgsiz <8)th n 

gsize <- 8 
elseif (sgsize*(n+1) > 128) then 

gsize «- 128/(n+1) 

els 

gsiz sgsiz 

endif 

ds <- signed 

cs +- signed A m 

as <- signed or m or n 

h <- (2*gsize) + n 

spos <- (ba..o) and (2*gsize-1 ) 

endcase 

dpos <r- (0 || b23..16) a nd (gsize-1) 
r <- spos 

sfsize <- (0 || b3i ..24) and (gsize-1 ) 

tfsize *- (sfsize = 0) or ((sfsize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize <- (tfsize + spos > h) ? h - spos : tfsize 
if (b<io..9 = Z) and not as then 
rnd <- F 

else 

rnd bio..9 

endif 

for i <- 0 to 1 28-gsize by gsize 
case op of 

E.EXTRACT: 
if m then 

P<-d gs ize+i-1..i 

else 

p«-(d ||c)2*(gsize+i)-1..2*i 

endif 
E.MULX: 
if n then 

if (i and gsize) = 0 then 

p <- muKgsize.h.ds.d.i.cs.c.i) - mul(gsize,h,ds,d,i+size,cs f c,i+size) 

else 

p 4- muKgsize.h.ds.d^cs.c.i+size) + muKgsize.h.ds.dj.cs.c.i+size) 

endif 

else 

p <- mul(gsize,h,ds,d J.cs.cj) 

endif 



Fig. 44G (cont) 



E.SCALADD.X: 
if n then 

if(iandgsiz ) = Othen 

p <- mul(gsize,h f ds f d ( i,bs,b t 64+2*gsize) 
+ muKgsize.h.cs.ci.bs.b.M) 
-mul(gsiz ,h l ds,d t i+gsize I bs,b,64+3*gsiz ) 
-muKgsize.h.cs.c.i+gsize.bs.b.W+gsiz ) 

else 

p <- muKgsize.h.ds.d.i.bs.b.M+S'gsize) 
+ mul(gsize f h,cs t c,i,bs,b,64+gsize) 
+ mul(gsize f h,ds,d,i+gsize,bs t b f 64+2 # gsize) 
+ muKgsize.h.cs.cJ+gsize.bs^.fM) 

endif 

else 

p <- mul(gsize,h l ds f d,i l bs,b,64+gsize) + muKgsize.h.cs.ai.bs.b.M) 

endif 



endcase 




case md of 


N: 








Z: 






s «- 0 h " r 


F: 






s<-0 h 


C: 






s <- 0 h " r 


endcase 




v ((as 


&Ph-l)llP) 



II -Prll P^ 1 
IIPFi-1 



if (Vh..r+fsize = (as & v r+fs ize-l) h+1 " r " fsize ) or not (I and (op = E. EXTRACT)) then 
w <_ (as & v^^^gsize-feizeKipos || VfS j 2e -i + r..r II 0 d P° s 

else 

w <- (s ? ( Vh || ~vfl slze - d P° s - 1 ) : igsize-dpos) || O dpos 

endif 

if m and (op = E. EXTRACT) then 

a$ize-1+Li «- Cgsize-1+Ldpos+fsize+i II Wdpos+fsize-L.dpos II c<jpos-1+1..i 

else 

asize-1+i..i^-w 

endif 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none * — . 

Fig. 44G (cont) 



X.DEP0SIT.2 


Crossbar deposit signed pecks 


X.DEP0SIT.4 


Crossbar deposit signed nibbles 


X.DEP0SIT.8 


Crossbar deposit signed bytes 


X.DEP0SIT.16 


Crossbar deposit signed doublets 


X.DEPOSIT.32 


Crossbar deposit signed quadlets 


XDEPOSIT.64 


Crossbar deposit signed octlets j 


X.DEPOSIT.128 


Crossbar deposit signed hexlet i 


X.DEP0SIT.U.2 


Crossbar deposit unsigned pecks 


X.DEP0SIT.U.4 


Crossbar deposit unsigned nibbles 


X.DEP0SIT.U.8 


Crossbar deposit unsigned bytes 


X.DEP0SIT.U.16 


Crossbar deposit unsigned doublets 


X.DEPOSIT.U.32 


Crossbar deposit unsigned quadlets 


X.DEPOSIT.U.64 


Crossbar deposit unsigned octlets 


X.DEPOSIT.U.128 


Crossbar deposit unsigned hexlet 


X.WITHDRAW.U.2 


Crossbar withdraw unsigned pecks 


X.WITHDRAW.U.4 


Crossbar withdraw unsigned nibbles 


X.WITHDRAW.U.8 


Crossbar withdraw unsigned bytes 


X.WITHDRAW.U. 1 6 


Crossbar withdraw unsigned doublets 


X.WITHDRAW.U.32 


Crossbar withdraw unsigned quadlets 


X.WITHDRAW.U.64 


Crossbar withdraw unsigned octlets 


X.WITHDRAW.U.128 


Crossbar withdraw unsigned hexlet 


X.WITHDRAW.2 


Crossbar withdraw pecks 


X.WITHDRAW.4 


Crossbar withdraw nibbles 


X.WITHDRAW.8 


Crossbar withdraw bytes 


X.WITHDRAW.16 


Crossbar withdraw doublets 


X.WITHDRAW.32 


Crossbar withdraw quadlets 


X.WITHDRAW.64 


Crossbar withdraw octlets 


X.WITHDRAW.1 28 


Crossbar withdraw hexlet 



Fig. 45A 



Equivalenci s 



XSEXI.2 


Crossbar extend immediate signed pecks 


X.SEX.1.4 


Crossbar extend immediate signed nibbles 


XSEXI.8 


Crossbar extend immediate signed bytes 


XSEXI.16 


Crossbar extend immediate signed doublets 


X.SEXI.32 


Crossbar extend immediate signed quadlets 


XSEX.1.64 


Crossbar extend immediate signed octlets i 


X.SEXI.128 


Crossbar extend immediate signed hexlet 


X.ZEX.1.2 


Crossbar extend immediate unsigned pecks 


XZEX.1.4 


Crossbar extend immediate unsigned nibbles 


XZEX.1.8 


Crossbar extend immediate unsigned bytes 


XZEX.1.16 


Crossbar extend immediate unsigned doublets 


XZEXI.32 


Crossbar extend immediate unsigned quadlets 


XZEXI.64 


Crossbar extend immediate unsigned octlets 


XZEXI.128 


Crossbar extend immediate unsigned hexlet 



X.SHLI.gsize rd-rc,i 


-> 


X.DEPOSIT.gsize rd=rc,size-i,i 


X.SHR.I.gsize rd=rc,i 


-> 


X.WITHDRAW.gsize rd=rc,size-i,i 


XSHRU.I.gsize rd=rc,i 


-> 


X.WITHDRAW.U.gsize rd=rc,size-i,i 


X.SEX.I.gsize rd=rc,i 


-> 


X.DEPOSIT.gsize rd=rc,i,0 


X.ZEX.I.gsize rd=rc,i 




XDEPOSIT.U.gsize rd=rc,i,0 


Redundancies 


X.DEPOSIT.gsize rd-rc,gsize,0 


<=> 


X.COPY rd=rc 


XDEPOSIT.U.gsize rd=rc,gsize,0 


<=> 


X.COPY rd=rc 


X. WITHDRA W.gsize rd=rc,gsize, 0 


<=> 


X.COPY rd=rc 


XWITHDRAW.U.gsize rd-rc,gsize,0 


<=> 


X.COPY rd=rc 



Fig. 45A (cont'd) 



Format 



X.op.gsize rd=rc,isize,ishift 
rd=xopgsize(rc,isize,ishift) 

31 26252423 18 17 1211 65 0 

I op I ih | rd 1 rc | gsfp 1 gsfs I 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs 4- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 

Fig. 45B 



Definition 

def CrossbarFieldfop.rd.rc.gsfp.gsfs) as 
c 4- RegRead(rc, 128) 
case ((opi || gsfp) and (opo || gsfs)) of 



0..63: 






gsize 


<- 


128 


64..95: 






gsize 


<- 


64 


96.. 111: 






gsize 


<— 


32 


112..119: 






gsize 


<- 


16 


120..123: 






gsize 


<r- 


8 


124..125: 






gsize 


<— 


4 


126: 






gsize 


<- 


2 


127: 







raise Reserved Instruction 

endcase 

ishift <- (opi || gsfp) and (gsize-1 ) 
isize <- ((opo || gsfs) and (gsize-1 ))+1 
if (ishift+isize>gsize) 

raise Reservedlnstruction 

end if 

case op of 

X.DEPOSIT: 

for i 0 to 128-gsize by gsize 

a i+g size-1.J «- cgsizensjze-ishift „ q+jsi2e . 1 j || O^hift 

endfor 
X.DEPOSIT.U: 

for i <- 0 to 128-gsize by gsize 

ai + gsize-1..i <- OOsize-isize-ishift „ Cj+jsj2eM . „ 0 ishift 

endfor 
X.WITHDRAW: 

for i <- 0 to 128-gsize by gsize 

aj+gsize-1..i +~ cflf s ^i?ihift-1 II c i+isize+ishift-1..i+ishift 
endfor 
X.WITHDRAW.U: 

for i <— 0 to 128-gsize by gsize 

3i+gsize-1..i «- 09 size - isize || Cj+j S ize+ishift-1..i+ishift 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved instruction 

Fig. 45C 





127 














ih,| | gsfp 














0 
















0 


ih 0 | 


gsfs 


127 



encoding for crossbar field 
Fig. 45D 



< — foizo > 




«« — fstze — > < dpo3 
crossbar deposit ~~ 

Fig. 45E 



< — fsizo — x — opoo 




< f3ize — ► 
crossbar withdraw ~™~ 



Fig. 45F 



Operation codes 



X.DEPOSIT.M.2 


Crossbar deposit merge pecks 


X.DEPOSIT.M.4 


Crossbar deposit merge nibbles 


X.DEPOSIT.M.8 


Crossbar deposit merge bytes 


X.DEPOSIT.M.16 


Crossbar deposit merge doublets 


X.DEPOSIT.M.32 


Crossbar deposit merge quadlets 


X.DEPOSIT.M.64 


Crossbar deposit merge octlets 


X.DEPOSIT.M.128 


Crossbar deposit merge hexlet 



Fig 45G 



Format 



X.op.gsize rd@rc,isize,ishift 
rd=xopgsize(rd,rc,isize,ishift) 

31 26252423 1817 1211 65 0 

I op I ih 1 rd | rc I gsfp I gsfs | 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs <- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 



Fig 45H 



D fmition 

def CrossbarFieldlnplacefop.rd.rc.gsfp.gsfs) as 
c<- RegRead(rc, 128) 
d «- RegRead(rd, 128) 
case ((opi || gsfp) and (opo || gsfs)) of 
0..63: 

gsize <- 128 
64..95: 

gsize <- 64 
96..111: 

gsize <- 32 
112..119: 

gsize <- 16 
120..123: 

gsize <- 8 
124.. 125: 

gsize <- 4 

126: 

gsize <- 2 

127: 

raise Reserved Instruction 

endcase 

ishift <- (opi || gsfp) and (gsize-1) 
isize <- ((opo || gsfs) and (gsize-1 ))+1 
if (ishift+isize>gsize) 

raise Reserved Instruction 

endif 

for i <- 0 to 128-gsize by gsize 

ai+gsize-1..i «- di+gsize-1..i+isize+ishift II c i+isize-1 ..I II dj+jshift-1 ..i 
endfor 

RegWrite(rd, 128,a) 
enddef 

Exceptions 

Reserved instruction 

Fig 45! 



< — feee — ► 




71 r - j^" a c|kvn 



Til IMS S3 



<■ — fsiz e — »« dpoa 
crossbar deposit merge 



rd 



rd 



Fig 45J 



X SHUFFLE 4 


Crossbar shuffle within Decks 

VI wwwwui wl lUlllw if ill ill l pwwiw 


X SHUFFLE 8 


Crossbar shuffle within bvtes 

WwwWwII wl lUlllw If III III 1 K/ J w\y w 


X.SHUFFLE.16 


Crossbar shuffle within doublets 


X.SHUFFLE.32 


Crossbar shuffle within quadlets - 


X.SHUFFLE.64 


Crossbar shuffle within octlets 


X.SHUFFLE.128 


Crossbar shuffle within hexlet 


X.SHUFFLE.256 


Crossbar shuffle within triclet 



Fig.46A 



Format 



X.SHUFFLE.256 rd=rc,rb,v,w,h 
X.SHUFFLE.size rd=rcb,v,w 

rd=xshuffle256(rc,rb,v,w,h) 
rd=xshufflesize(rcb,v,w) 

31 24 23 18 17 12 11 65 0 

r*xT§HUFFLE I rd | rc | rb | op | 

8 6 6 6 6 

rc <r- rb <- rcb 
x<-log2(size) 
y<-log2(v) 
z<-log2(w) 

op 4- ((x*x*x-3*x*x-4*x)/6-(z*z-z)/2+x*z+y) + (size=256)*(h*32-56) 



Fig. 46B 



Definition 



def CrossbarShufflefmajor.rd.rc.rb.op) 
c«- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
if rc=rb then 
case op of 
0..55: 

for x <- 2 to 7; for y ^ 0 to x-2; for z <- 1 to x-y-1 

if op = ((x*x*x-3*x*x-4*x)/6-(z*z-z)/2+x*z+y) then 
fori <-0to 127 

a i <~ c fl6..x II iy*z-1..y II i X -1..y+z II «y-1..o) 

end 

endif 

endfor; endfor; endfor 
56..63: 

raise Reservedlnstruction 

endcase 

elseif 

case op4..o of 
0..27: 

cb <- c || b 
x<-8 
h <- ops 

for y <- 0 to x-2; for z <- 1 to x-y-1 

if op 4 ..o = ((1 7*z-z*z)/2-8+y) then 
fori<-h*128to127+h*128 

ai-h*128 «- cbp^ y || ix .i..y + z || ^..o) 

end 

endif 
endfor, endfor 
28..31: 

raise Reservedlnstruction 

endcase 

endif 

RegWrite(rd f 128, a) 
enddef 



Exceptions 

Reserved Instruction 



Fig.46C 



127 rcb(128) o 




127 rd(128) o 



4-way shuffle bytes within hexlet 
Fig. 46D 




127 rd(128) o 



4-way shuffle bytes within triclet 
Fig. 46E 



Format 



X.SWIZZLE rd=rc,icopy,jswap 
rd=xswizzle(rc,icopy,iswap) 

31 26 2524 23 18 17 12 11 6 5 0 

["xlswiZZLE | ih | rd I rc I icopya I iswapa I 

6 2 6 6 6 6 

icopya <- icopy5..o 
iswapa <- iswaps..o 
ih <- icopy6 II iswap6 

Fig. 47A 



Definition 

def GroupSwizzlelmmediate(ih,rd,rc,icopya,iswapa) as 
icopy <- ihi || icopya 
iswap <- iho || iswapa 
c <- RegRead(rc, 128) 
fori<-0to 127 

3i *- c (i & icopy) A iswap 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 

Fig; 47B 




16-bit reverse 



Fig. 47C 



1X.SELECT.8 



| Crossbar select bytes 



Format 



op ra=rd,rc,rb 



ra=op(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 



I op | rd I rc | rb | ra 

8 6 6 6 6 

Fig. 47D 



Definition 

def CrossbarTernaryfop.rd.rc.rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
dc <- d || c 
for i<-Oto 15 

j <- b8 # j+4..8*i 

a8*i+7..8*i dcs*j+7..8*j 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 



Fig. 47E 



Pin summary 



A20M# 


I 


Address bit 20 Mask is an emulator signal. 


A31..A3 


10 


Address, in combination with byte nable, indicate the 
physical addresses of memory or device that is the target 
of a bus transaction. This signal is an output, when the 
processor is initiating the bus transaction, and an input 
when the processor is receiving an inquire transaction or 
snooping another processor's bus transaction. 


ADS# 


IO 


AD dress Strobe, when asserted, indicates new bus 
transaction by the processor, with valid address and byte 
enable simultaneously driven. 


ADSC# 


0 


Address Strobe Copy is driven identically to address 
strobe 


AHOLD 


I 


Address HOLD, when asserted, causes the processor to 
cease driving address and address parity in the next bus 
clock cycle. 


AP 


IO 


Address Parity contains even parity on the same cycle as 
address. Address parity is generated by the processor 
when address is an output, and is checked when address 
is an input. A parity error causes a bus error machine 
check. 


APCHK# 


0 


Address Parity CHecK is asserted two bus clocks after 
EADS# if address parity is not even parity of address. 


APICEN 


I 


Advanced Programmable Interrupt Controller ENable 

is not implemented. 


BE7#..BE0# 


IO 


Byte Enable indicates which bytes are the subject of a 
read or write transaction and are driven on the same cycle 
as address. 


BF1..BF0 


I 


Bus Frequency is sampled to permit software to select 
the ratio of the processor clock to the bus clock. 


BOFF# 


I 


BackOFF is sampled on the rising edge of each bus clock, 
and when asserted, the processor floats bus signals on the 
next bus clock and aborts the current bus cycle, until the 
backoff signal is sampled negated. 


BP3..BP0 


0 


Breakpoint is an emulator signal. 


BRDY# 


I 


Bus ReaDY indicates that valid data is present on data on 
a read transaction, or that data has been accepted on a 
write transaction. 


BRDYC# 


I 


Bus ReaDY Copy is identical to BRDY#; asserting either 
signal has the same effect. 


BREQ 


0 


Bus REQuest indicates a processor initiated bus request. 



Fig. 48 



BUSCHK# 


1 


BUS CH cK is sampled on the rising edge of the bus 
clock, and when asserted, causes a bus error machine 
check. 


CACHE# 


0 


CACHE, when asserted, indicates a cacheable read 
transaction or a burst write transaction. 


CLK 




bus CLocK provides the bus clock timing edge and the 
frequency reference for the processor clock. 


CPUTYP 


, 


CPU TYPe, if low indicates the primary processor, if high, 
the dual processor. 


D/C# 


1 


Data/Code is driven with the address signal to indicate 
data, code, or special cycles. 


D63..D0 


10 


Data communicates 64 bits of data per bus clock. 


D/P# 


0 


Dual/Primary is driven (asserted, low) with address on 
the primary processor 


DP7..DP0 


10 


Data Parity contains even parity on the same cycle as 
data. A parity error causes a bus error machine check. 


DPEN# 


10 


Dual Processing Enable is asserted (driven low) by a 
Dual processor at reset and sampled by a Primary 
processor at the falling edge of reset. 


EADS# 


, 


External Address Strobe indicates that an external 
device has driven address for an inquire cycle. 


EWBE# 


1 


External Write Buffer Empty indicates that the external 
system has no pending write. 


FERR# 


0 


Floating point ERRor is an emulator signal. 


FLUSH# 


1 


cache FLUSH is an emulator signal. 


FRCMC# 




Functional Redundancy Checking Master/Checker is 

not implemented. 


HIT# 


10 


HIT indicates that an inquire cycle or cache snoop hits a 
valid line. 


HITM# 


10 


HIT to a Modfied line indicates that an inquire cycle or 
cache snoop hits a sub-block in the M cache state. 


HLDA 


0 


bus HoLD Acknowlege is asserted (driven high) to 
acknowlege a bus hold request 


HOLD 


1 


bus HOLD request causes the processor to float most of 
its pins and assert bus hold acknowlege after completing 
all outstanding bus transactions, or during reset. 


IERR# 


0 


Internal ERRor is an emulator signal. 


IGNNE# 




IGNore Numeric Error is an emulator signal. 


INIT 




INITialization is an emulator signal. 


INTR 


1 

1 


maskable INTeRrupt is an emulator signal. 


INV 


1 1 


IN Validation controls whether to invalidate the addressed 
cache sub-block on an inqure transaction. 



Fig. 48 (cont'd) 



KEN# 


I 


Cach ENable is driven with address to indicate that the 
read or write transaction is cacheable. 


1 1 1 RITA 

LINT1..LINT0 


1 
1 


Local INTerrupt is not implemented. 


LOCK# 


0 


bus LOCK is driven starting with address and ending 
after bus r ady to indicate a locked series of bus 
transactions. 


M/IU# 


o 


Memory/Input Output is driven with address to indicate a 
memory or i/u transaction. 


NA# 


1 


Next Address indicates that the external system will 
accept an address for a new bus cycle in two bus clocks. 


Kl IV >l 1 

NMI 


1 

1 


Non Maskable Interrupt is an emulator signal. 


PBGNT# 


10 


Private Bus GraNT is driven between Primary and Dual 
processors to indicate that bus arbitration has completed, 
granting a new master access to the bus. 


PBKcQff 


IO 


Private Bus REQuest is driven between Primary and Dual 
processors to request a new master access to the bus. 


rULJ 


o 


Page Cache Disable is driven with address to indicate a 
not cacheable transaction. 


PCHK# 


0 


Parity CHecK is asserted (driven low) two bus clocks after 
data appears with odd parity on enabled bytes. 


PHIT# 


IO 


Pnvate HIT is driven between Pnmary and Dual 
processors to indicate that the current read or write 
transaction addresses a valid cache sub-block in the slave 
processor. 


PHITM# 


10 


Private HIT Modified is dnven between Primary and Dual 
processors to indicate that the current read or write 
transaction addresses a modified cache sub-block in the 
slave processor. 


PICCLK 


1 


Programmable Interrupt Controller CLocK is not 

implemented. 


PICD1..PICD 
U 


IO 


Programmable Interrupt Controller Data is not 

implemented. 


nrkiii 

rbNff 


1 


Parity Enable, if active on the data cycle, allows a parity 
error to cause a bus error machine check. 


rMl..rlVIU 


o 


Performance Monitoring is an emulator signal. 


□ DRV 

rKUY 


o 


Probe ReaDY is not implemented. 


D\A/X 

rW I 


o 


Page Write Through is driven with address to indicate a 
not write allocate transaction. 


R/S# 


1— 


-Run/Stop is not implemented. 




i 

1 


Ktot 1 causes a processor reset. 


SCYC 


0 


Split CYCIe is asserted during bus lock to indicate that 
more than two transactions are in the series of bus 
transactions. 



Fig. 48 (cont'd) 



Olvllrr 


1 
1 


oysiem ivianayeirieni inuurupi is an oiiiuiaior signal. 


OIVIIMO 1 ft 




oysxem managernenx mierrupi mv* i ive is an ernuiaior 

oiyildl. 




i 


w 1 Ur wLUCrV lo Oil dllUlcUUI oiy Ileal. 


TCVC 


i 


TpqI PI nrK fnllnwc IFFF 114Q 1 

I C9l wLUCrX lOIIOWo ICC.Q I Ify. 1 . 


Till 


i 


Toct Rata Inniit fnllnwc IPPP 1 1AQ 1 
I6SI Uclia inpUl lOIIOWo luCC I Ifa. I. 


Tnn 


n 

V-/ 


Toc# riata Oiitnut frklln\A/c IPPP 114Q 1 

i esi L/aia vsuipui follows iccc i i . 


TMO 
1 IVIO 


1 

1 


Toot MaHa C Aloof fnlln\A/c IPPP 1 1 AQ 1 

1 ©si iviouo oeieci 1 ono Wo iccc i it*?, i . 


1 rxO 1 rr 


1 

1 


Toe* QaCaT fnllnvA/c IPPP 11 AO 1 

i ©si r\60u i loiiows icccz i i*f%7. i. 


VCC2 


1 


VCCof2.8V at 25 pins 


VVyl^rO 


1 
1 


\/pp O OX/ a 4 Oft nine 

voir or o.ov ax pins 


VCC2DET# 


0 


VCC2 DETect sets appropriate VCC2 voltage level. 


voo 


1 
1 


\/CQ ci mr\lio/*4 of nine 

voo supplied a\ do pins 


W/R# 


0 


Write/Read is driven with address to indicate write vs. 
read transaction. 


WB/WT# 


1 


Write Back/Write Through is returned to indicate that 
data is permitted to be cached as write back. 



Fig. 48 (cont'd) 



Electrical Specifications 



Clock rate 


66 M 


Hz 


75 M 


Hz 


100 MHz 


133 MHz 




Parameter 


min 


max 


min 


max 


min 


max 


min 


max 


unit 


CLK frequency 


33.3 


66.7 


37.5 


75 


50 


100 




133 


MH 
z 


CLK period 


15.0 


30.0 


13.3 


26.3 


10.0 


20.0 






ns ! 


CLK high time (>2v) 


4.0 




4.0 




3.0 








ns 


CLK low time (<0.8V) 


4.0 




4.0 




3.0 








ns 


CLK rise time (0.8V->2V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK fall time (2V->0.8V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK period stability 




250 




250 




250 






P s . 



Fig. 49A 



A31..3 valid delay 


1.1 


6.3 


1.1 


4.5 


1.1 


4.0 






ns 


A31 ..3 float delay 




10.0 




7.0 




7.0 






ns 


ADS# valid delay 


1.0 


6.0 


1.0 


4.5 


A f\ 

1.0 


4.0 ! 






ns 


ADS# float delay 




10.0 




7.0 i 




7.0 






ns 


ADSC# valid delay 


1.0 ! 


7.0 


1.0 


4.5 


A f\ 

1.0 


4.0 






ns 


ADSC# float delay 




10.0 




7.0 




7.0 






ns 


AP valid delay 


1.0 


8.5 


1.0 


5.5 


1.0 


5.5 






ns 


AP float delay 




10.0 




7.0 




7.0 






ns 


APCHK# valid delay 


1.0 


8.3 


1.0 


4.5 


1.0 


4.5 






ns 


BE7..0# valid delay 


1.0 


7.0 


1.0 


4.5 


1.0 


4.0 






ns 


BE7..0# float delay 




10.0 




7.0 




7.0 






ns 


BP3..0 valid delay 


1.0 


10.0 














ns 


BREQ valid delay 


1.0 


8.0 


1.0 


4.5 


1.0 


4.0 | 






ns 


CACHE# valid delay 


1.0 


7.0 


1.0 


4.5 
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op rd=rc,rb 
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D finition 



def Load(op,rd,rc,rb) as 
case op of 

L16L, L32L, L8, L16AL, L32AL, L16B, L32B, L16AB, L32AB, 
L64L, L64AL, L64B, L64AB: 
signed <- true 

LU16L, LU32L, LU8, LU16AL, LU32AL, LU16B, LU32B, LU16AB, LU32AB, 
LU64L, LU64AL, LU64B, LU64AB: 

signed «- false 
L128L, L128AL, L128B, L128AB: 

signed <- undefined 

endcase 
case op of 
L8, LU8: 

size <- 8 

L16L, LU16L, L16AL, LU16AL, L16B, LU16B, L16AB, LU16AB: 
size <- 16 

L32L, LU32L, L32AL, LU32AL, L32B. LU32B, L32AB. LU32AB: 
size <- 32 

L64L, LU64L, L64AL, LU64AL, L64B. LU64B, L64AB, LU64AB: 

size ^ 64 

L128L, L128AL, L128B, L128AB: 

size 4- 128 

endcase 

Isize <r~ log(size) 

case op of 

L16L. LU16L, L32L, LU32L, L64L f LU64L, L128L, 
L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL: 
order <- L 

L16B, LU16B, L32B, LU32B, L64B, LU64B, L128B, 

L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 

order +- B 
L8 f LU8: 

order *- undefined 

endcase 
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c <r- RegRead(rc, 64) 

b <- RegRead(rb, 64) 

VirtAddr <- c + (b 6 6-lsize..O II 0 ,size - 3 ) 

case op of 

L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL, 
L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 
if (C|size-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

endif 

L16L, LU16L, L32L, LU32L, L64L, LU64L, L128L, 
L16B, LU16B, L32B, LU32B, L64B, LU64B, L128B: 
L8, LU8: 
endcase 

m <- LoadMemory(c,VirtAddr,size,order) 
a <- (msize-1 and signed) 1 28-size || m 
RegWrite(rd, 128, a) 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 50C (cont) 



Op rati n codes 



L.1.8 


Load immediate signed byte 


LI.16AB 


Load immediate signed doublet aligned big-endian 


LI.16.B 


Load immediate signed doublet big-endian 


LI.16.A.L 


Load immediate signed doublet aligned little-endian 


L.I.16.L 


Load immediate signed doublet little-endian 


L.I.32.A.B 


Load immediate signed quadlet aligned big-endian 


L.I.32.B 


Load immediate signed quadlet big-endian 


L.I.32.A.L 


Load immediate signed quadlet aligned little-endian 


LI.32.L 


Load immediate signed quadlet little-endian 


L.I.64.A.B 


Load immediate signed octlet aligned big-endian 


LI.64.B 


Load immediate signed octlet big-endian 


LI.64.A.L 


Load immediate signed octlet aligned little-endian 


L.I.64.L 


Load immediate signed octlet little-endian 


LI.128.A.B 


Load immediate hexlet aligned big-endian 


LI.128.B 


Load immediate hexlet big-endian 


L.I.128.A.L 


Load immediate hexlet aligned little-endian 


L.I.128.L 


Load immediate hexlet little-endian 


L.I.U.8 


Load immediate unsigned byte 


LI.U.16.A.B 


Load immediate unsigned doublet aligned big-endian 


LI.U.16.B 


Load immediate unsigned doublet big-endian 


LI.U.16.A.L 


Load immediate unsigned doublet aligned little-endian 


LI.U.16.L 


Load immediate unsigned doublet little-endian 


L.I.U.32.A.B 


Load immediate unsigned quadlet aligned big-endian 


LI.U.32.B 


Load immediate unsigned quadlet big-endian 


L.I.U.32.A.L 


Load immediate unsigned quadlet aligned little-endian I 


LI.U.32.L 


Load immediate unsigned quadlet little-endian 


L.I.U.64.A.B 


Load immediate unsigned octlet aligned big-endian 


LI.U.64.B 


Load immediate unsigned octlet big-endian 


L.I.U.64.A.L 


Load immediate unsigned octlet aligned little-endian 


LI.U.64.L 


Load immediate unsigned octlet little-endian • 



Fig. 51 A 



Selection 



number format 


type 


size 


alignment 


ordering 


signed byte 




8 






unsigned byte 


u 


8 






signed integer 




16 32 64 




L B 


signed integer aligned 




16 32 64 


A 


L B 


unsigned integer 


u 


16 32 64 




L B 


unsigned integer aligned 


u 


16 32 64 


A 


L B 1 


register 




128 




L B 


register aligned 




128 


A 


L B 



Format 



op rd=rc,offset 
rd=op(rc,offset) 

31 24 23 18 17 12 11 0 

I op | rd | rc | offset | 

8 6 6 12 
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Definition 



def Loadlmmediate(op,rd,rc,offset) as 
case op of 

LI16L, LI32L, LI8, LI16AL, LI32AL, LI16B, LI32B, LI16AB, LI32AB: 
LI64L, LI64AL, LI64B, LI64AB: 

signed «- taie 
LIU16L, LIU32L, LIU8, LIU16AL, LIU32AL, 
LIU16B, LIU32B, LIU16AB. LIU32AB: 
LIU64L, LIU64AL, LIU64B, LIU64AB: 

signed <- false 
LI128L, LI128AL, LI128B, LI128AB: 

signed «- undefined 

endcase 
case op of 

LI8, LIU8: 
size <- 8 

LI16L, LIU16L, LI16AL, LIU16AL. LI16B, LIU16B, LI16AB, LIU16AB: 
size «- 16 

LI32L, LIU32L, LI32AL, LIU32AL, LI32B, LIU32B, LI32AB, LIU32AB: 
size <- 32 

LI64L, LIU64L, LI64AL, LIU64AL, LI64B, LIU64B, LI64AB, LIU64AB 

sIzg ^ 64 

LI128L, LI128AL, LI128B, LI128AB: 

size <- 128 

endcase 

Isize <- log(size) 

case op of 

LI16L, LIU16L, LI32L, LIU32L, LI64L, LIU64L, LI128L, 
LI16AL, LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL: 
order <- LI 

LI16B, LIU16B, LI32B, LIU32B, LI64B, LIU64B, LI128B, 

LI16AB, LIU16AB, LI32AB, LIU32AB, LI64AB, LIU64AB, LI128AB: 

order <- B 
LI8, LIU8: 

order <- undefined 

endcase 
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c <- RegRead(rc, 64) 

VirtAddr <- c + (offeetffi-M» || offset || 0 lsize - 3 ) 
case op of 

LI16AL, LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL, 
LI16AB, LIU16AB, LI32AB, LIU32AB, LI64AB, LIU64AB, LI128AB: 

if (C| S ize-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

endif 

LI16L, LIU16L, LI32L, LIU32L, LI64L, LIU64L, LI128L, 
LI16B, LIU16B, LI32B, LIU32B, LI64B, LIU64B, LI128B: 
LI8, LIU8: 
endcase 

m <- LoadMemoryCcVirtAddr.size.order) 
a «- (msize-1 and signed) 1 28 ' size || m 
RegWrite(rd, 128, a) 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 51C(cont) 



Operation codes 



S.8 


Store byte 


S.16.B 


Store double big-endian 


S.16.A.B 


Store double aligned big-endian 


S.16.L 


Store double little-endian j 


S.16.A.L 


Store double aligned little-endian 1 


S.32.B 


Store quadlet big-endian 


S.32AB 


Store quadlet aligned big-endian j 


S.32.L 


Store quadlet little-endian 


S.32.A.L 


Store quadlet aligned little-endian 


S.64.B 


Store octlet big-endian 


S.64.A.B 


Store octlet aligned big-endian 


S.64.L 


Store octlet little-endian 


S.64.A.L 


Store octlet aligned little-endian 


S.128.B 


Store hexlet big-endian 


S.128.A.B 


Store hexlet aligned big-endian 


S.128.L 


Store hexlet little-endian 


S.128.A.L 


Store hexlet aligned little-endian 


S.MUX.64.A.B 


Store multiplex octlet aligned big-endian 


S.MUX.64.A.L 


Store multiplex octlet aligned little-endian 



Fig. 52A 



Selection 



number format 


op 


size 


alignment 


ordering 


byte 




8 






integer 




16 32 64 128 




L B 


integer aligned 




16 32 64 128 


A 


L B 


multiplex 


MUX 


64 


A 


L B 



Format 



op rd.rc.rb 
op(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

| S.MINOR | rd | rc | rb | op I 

8 6 6 6 6 



Fig.52B 



Definition 



def Store(op,rd,rc,rb) as 
case op of 
S8: 

size <- 8 
S16L, S16AL, S16B, S16AB: 

size <- 16 
S32L, S32AL, S32B, S32AB: 

size «- 32 
S64L. S64AL, S64B, S64AB, 
SMUX64AB, SMUX64AL: 

size <- 64 
S128L, S128AL, S128B, S128AB: 

size <- 128 

endcase 
Isize <- log(size) 
case op of 
S8: 

order <- undefined 
S16L, S32L, S64L, S128L, 
S16AL, S32AL, S64AL, S128AL, SMUX64ALI: 

order <- L 
S16B, S32B, S64B, S128B, 
S16AB, S32AB, S64AB, S128AB, SMUX64ABI: 

order B 

endcase 

c <- RegRead(rc, 64) 

b <- RegRead(rb, 64) 

VirtAddr <- c + (b 6 6-lsize..O II 0 lsize - 3 ) 

case op of 

S16AL, S32AL, S64AL, S128AL, 

S16AB, S32AB, S64AB, S128AB, 

SMUX64AB, SMUX64AL: 

if (C|size-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

endif 

S16L, S32L. S64L, S128L, 
S16B,S32B,S64B,S128B: 
S8: 
endcase 



Fig. 52C 



d <- RegRead(rd, 128) 
cas op of 
S8, 

S16L, S16AL, S16B, S16AB, 
S32L, S32AL, S32B, S32AB, 
S64L, S64AL, S64B, S64AB, 
S128L, S128AL, S128B, S128AB: 

StoreMemory(c f VirtAddr,size f order,d S i ze -i..o) 
SMUX64AB, SMUX64AL: 

lock 

a <- LoadMemoryWfc.VirtAddr.size.order) 

m +- (di27..64 & d63..o) I (a & ~d63..o) 
StoreMemorytcVirtAddr.size^rder.m) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 52C (cont) 



Operation codes 



S.1.8 


Store immediate byte 


S.I.16.A.B 


Store immediate double aligned big-endian 


S.I.16.B 


Store immediate double big-endian 


S.I.16.A.L 


Store immediate double aligned little-endian 


S.I.16.L 


Store immediate double little-endian 


S.I.32.A.B 


Store immediate quadlet aligned big-endian 


S.I.32.B 


Store immediate quadlet big-endian 


S.I.32.A.L 


Store immediate quadlet aligned little-endian 


S.I.32.L 


Store immediate quadlet little-endian 


S.I.64.A.B 


Store immediate octlet aligned big-endian 


S.I.64.B 


Store immediate octlet big-endian 


S.I.64.A.L 


Store immediate octlet aligned little-endian 


S.I.64.L 


Store immediate octlet little-endian 


S.I.128.A.B 


Store immediate hexlet aligned big-endian 


S.I.128.B 


Store immediate hexlet big-endian 


S.I.128.A.L 


Store immediate hexlet aligned little-endian 


S.I.128.L 


Store immediate hexlet little-endian 


S.MUXI.64.A.B 


Store multiplex immediate octlet aligned big-endian 


S.MUXI.64.A.L 


Store multiplex immediate octlet aligned little-endian 



Fig. 53A 



Selection 



number format 


op 


size 


alignment 


ordering 


byte 




8 






integer 




16 32 64 128 




L B 


integer aligned 




16 32 64 128 


A 


L B 


multiplex 


MUX 


64 


A 


L B 



Format 



S.op.l.size.align.order rd.rc.offset 
sopisizealignorder(rd,rc,offset) 

31 24 23 18 17 12 11 0 

I op I rd I re | offset | 

8 6 6 12 

Fig. 53B 



Definition 



def Storelmmediate(op,rd,rc,offset) as 
case op of 
SI8: 

size <- 8 
SI16L, SI16AL, SI16B, SI16AB: 

size <- 16 
SI32L, SI32AL, SI32B, SI32AB: 

size <- 32 

SI64L. SI64AL, SI64B, SI64AB, SMUXI64AB, SMUXI64AL: 

size <- 64 
SI128L, SI128AL, S1128B, SI128AB: 

size <- 128 

endcase 
Isize <r- log(size) 
case op of 
SI8: 

order <- undefined 
SI16L, SI32L, SI64L, SI128L, 
SI1 6AL, SI32AL, SI64AL, SI1 28AL, SMUXI64AL: 

order <- L 
SI16B, SI32B, SI64B, SI128B, 
SI16AB, SI32AB, SI64AB, SI128AB, SMUXI64AB: 

order <- B 

endcase 

c <- RegRead(rc, 64) 

VirtAddr <- c + (offsetf f- |slze || offset || 0 ,size - 3 ) 

case op of 

SI16AL, SI32AL, SI64AL, SI128AL, 
SI16AB, SI32AB, SI64AB, SI128AB, 
SMUXI64AB, SMUXI64AL: 
if (C| S ize-4..0 * 0 then 

raise AccessDisallowed By Virtual Address 

endif 

SI16L,SI32L,SI64L,SI128L, 
SI16B. SI32B, SI64B, SI128B: 
SI8: 
endcase 



Fig. 53C 



d <- RegRead(rd, 128) 
cas op of 
SI8, 

SI16L, SI16AL, SI16B, SI16AB, 
SI32L, SI32AL, SI32B, SI32AB, 
SI64L, SI64AL, SI64B, SI64AB, 
SI128L, SI128AL, SI128B, SI128AB: 

StoreMemory(c t VirtAddr l size f order,d S | ze .i..o) 
SMUXI64AB, SMUXI64AL: 

lock 

a <- LoadMemoryW(c,VirtAddr,size,order) 

m <- (di27..84 & C163..0) I (a & ~d63..0) 
StoreMemoryCc.VirtAddr.size.order.m) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 53C (cont) 
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